Spaces:

Rishabh2095
/

AgentWorkflowJobApplications

Sleeping

App Files Files Community

AgentWorkflowJobApplications / src /job_writing_agent /workflow.py

Rishabh2095

Stop tracking job_writer.log

45de167 16 days ago

raw

history blame contribute delete

8.33 kB

	"""Workflow runner and CLI entry point for the job application writer."""

	# Standard library imports
	import asyncio
	import logging
	import os
	import sys
	from datetime import datetime
	from typing import Any

	# Third-party imports
	from langchain_core.tracers import ConsoleCallbackHandler, LangChainTracer
	from langchain_core.runnables import RunnableConfig

	# Local imports
	from job_writing_agent.classes import DataLoadState, NodeName
	from job_writing_agent.graph import build_job_app_graph
	from job_writing_agent.utils.application_cli_interface import handle_cli
	from job_writing_agent.utils.logging.logging_decorators import (
	log_errors,
	log_execution,
	)
	from job_writing_agent.utils.result_utils import print_result, save_result

	logger = logging.getLogger(__name__)


	class JobWorkflow:
	"""
	Workflow orchestrator for the job application writer.

	This class coordinates the execution of the job application writing workflow,
	managing the LangGraph state machine and LangSmith tracing. It follows the
	orchestrator pattern, coordinating multiple subgraphs and nodes without
	implementing business logic itself.

	The workflow consists of:
	1. Data Loading: Parse resume and job description (parallel subgraph)
	2. Research: Company research and relevance filtering (subgraph)
	3. Draft Creation: Generate initial application material
	4. Critique: AI-powered feedback on the draft
	5. Human Approval: User feedback collection
	6. Finalization: Incorporate feedback and produce final output
	"""

	def __init__(self, resume: str, job_description_source: str, content: str):
	"""
	Initialize the JobWorkflow orchestrator.

	Parameters
	----------
	resume: str
	Path to the resume file or resume text.
	job_description_source: str
	URL, file path, or text content of the job description.
	content: str
	Type of application material to generate ("cover_letter", "bullets", "linkedin_note").
	"""
	self.resume = resume
	self.job_description_source = job_description_source
	self.content = content

	def __repr__(self) -> str:
	return (
	f"JobWorkflow(resume={self.resume!r}, "
	f"job_description_source={self.job_description_source!r}, "
	f"content={self.content!r})"
	)

	def _build_initial_workflow_state(self) -> DataLoadState:
	"""
	Get the initial application state for the workflow.

	Returns
	-------
	DataLoadState
	Initialized state dictionary with resume path, job description source,
	content type, and empty messages list.
	"""

	return {
	"resume_path": self.resume,
	"job_description_source": self.job_description_source,
	"content_category": self.content,
	"current_node": "",
	"messages": [],
	"company_research_data": {},
	}

	def _get_callbacks(self) -> list[Any]:
	"""
	Get list of callbacks including LangSmith tracer with enhanced metadata.

	This method creates callback handlers for LangGraph execution, including
	LangSmith tracing with workflow-level metadata and tags for better
	observability and filtering in the LangSmith UI.

	Returns
	-------
	list
	List of callback handlers for LangGraph execution, including:
	- ConsoleCallbackHandler: Console output
	- LangChainTracer: LangSmith tracing (if enabled)
	"""
	callbacks: list[Any] = [ConsoleCallbackHandler()]

	# Add LangSmith tracer if tracing is enabled via environment variable
	if os.getenv("LANGSMITH_TRACING", "").lower() == "true":
	try:
	# LangChainTracer automatically reads from environment variables:
	# - LANGSMITH_API_KEY
	# - LANGSMITH_PROJECT (optional, defaults to "default")
	# - LANGSMITH_ENDPOINT (optional, defaults to https://api.smith.langchain.com)
	langsmith_tracer = LangChainTracer(
	project_name=os.getenv(
	"LANGSMITH_PROJECT", "job_application_writer"
	)
	)
	callbacks.append(langsmith_tracer)
	logger.info("LangSmith tracing enabled with metadata")
	except Exception as e:
	logger.warning(
	f"Failed to initialize LangSmith tracer: {e}. Continuing without tracing."
	)
	else:
	logger.debug(
	"LangSmith tracing is not enabled (LANGSMITH_TRACING != 'true')"
	)

	return callbacks

	def _build_runnable_config(self) -> RunnableConfig:
	"""
	Build RunnableConfig with LangSmith tracing metadata.

	Creates a config with workflow-specific tags, metadata, and callbacks
	for comprehensive observability across all LLM calls.

	Returns
	-------
	RunnableConfig
	Configured for LangSmith tracing with content-specific metadata.
	"""
	current_time = datetime.now()
	thread_id = f"job_workflow_session_{current_time:%Y%m%d%H%M%S}"
	timestamp = current_time.strftime("%Y%m%d-%H%M%S")

	return {
	"configurable": {"thread_id": thread_id},
	"callbacks": self._get_callbacks(),
	"run_name": f"JobAppWorkflow.{self.content}.{timestamp}",
	"metadata": {
	"workflow": "job_application_writer",
	"content_type": self.content,
	"session_id": thread_id,
	},
	"tags": ["job-application-workflow", self.content],
	"recursion_limit": 2,
	}

	@log_execution
	@log_errors
	async def run_workflow(self) -> dict[str, Any] \| None:
	"""
	Execute the complete job application writer workflow.

	This method compiles the graph, configures LangSmith tracing with
	enhanced metadata, and executes the workflow. It handles errors
	gracefully and returns the final state or None if execution fails.

	Returns
	-------
	Optional[Dict[str, Any]]
	Final workflow state containing the generated application material
	in the "output_data" field, or None if execution fails.
	"""
	try:
	compiled_graph = build_job_app_graph()
	except Exception as e:
	logger.error("Error compiling graph: %s", e, exc_info=True)
	return None

	# Prepare enhanced LangSmith metadata and tags
	current_time = datetime.now()
	initial_workflow_state = self._build_initial_workflow_state()
	thread_id = f"job_workflow_session_{current_time:%Y%m%d%H%M%S}"
	timestamp = current_time.strftime("%Y%m%d-%H%M%S")

	# Descriptive run name for LangSmith UI
	run_name = f"JobAppWorkflow.{self.content}.{timestamp}"

	config: RunnableConfig = self._build_runnable_config()

	try:
	initial_workflow_state["current_node"] = NodeName.LOAD
	logger.info(
	f"Starting workflow execution: {run_name} "
	f"(content_type={self.content}, session_id={thread_id})"
	)
	graph_output = await compiled_graph.ainvoke(initial_workflow_state, config=config)
	logger.info("Workflow execution completed successfully")
	return graph_output
	except Exception as e:
	logger.error("Error running graph: %s", e, exc_info=True)
	return None


	def main():
	args = handle_cli()
	workflow = JobWorkflow(
	resume=args.resume,
	job_description_source=args.jd_source,
	content=args.content_type,
	)
	result = asyncio.run(workflow.run_workflow())
	if result and "output_data" in result:
	print_result(args.content_type, result.get("output_data", ""))
	save_result(args.content_type, result.get("output_data", ""))
	print("Workflow completed successfully.")
	else:
	print("Error running workflow. No output data available.")
	sys.exit(1)


	if __name__ == "__main__":
	main()