Spaces:

Kaito117
/

linkedin_profile_scoring

No application file

App Files Files Community

Kaito117 committed on Jun 30, 2025

Commit

4ea17aa

1 Parent(s): c556cb0

hf spaces setup files

Browse files

Files changed (5) hide show

Dockerfile_spaces +34 -0
README_API.md +108 -0
README_spaces.md +8 -0
api_main.py +255 -0
demo_api.py +113 -0

Dockerfile_spaces ADDED Viewed

	@@ -0,0 +1,34 @@

+FROM python:3.11-slim
+# Hugging Face Docker Spaces run the container as UID 1000, so create that
+# user up front; anything the app must write to is handed to it below.
+RUN useradd -m -u 1000 user
+WORKDIR /app
+# Install system dependencies (curl is used by the HEALTHCHECK below).
+# --no-install-recommends keeps optional packages out of the image.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    curl \
+    && rm -rf /var/lib/apt/lists/*
+# Copy requirements and install Python dependencies
+COPY requirements.txt .
+COPY pyproject.toml .
+RUN pip install --no-cache-dir -r requirements.txt
+RUN pip install --no-cache-dir fastapi uvicorn
+# Copy application code, owned by the runtime user
+COPY --chown=user . .
+# Create necessary directories and make them writable by the runtime user
+RUN mkdir -p /app/logs && chown user:user /app /app/logs
+# Set environment variables
+ENV PYTHONPATH=/app
+ENV PORT=7860
+# Expose port
+EXPOSE 7860
+# Health check
+HEALTHCHECK --interval=30s --timeout=30s --start-period=5s --retries=3 \
+    CMD curl -f http://localhost:7860/health || exit 1
+# Drop root privileges for the running application
+USER user
+# Run the application
+CMD ["python", "api_main.py"]

README_API.md ADDED Viewed

	@@ -0,0 +1,108 @@

+# LinkedIn Sourcing Agent API 🎯
+An AI-powered candidate sourcing and scoring system that automatically finds, analyzes, and ranks LinkedIn candidates for job openings.
+## 🚀 Features
+- **Intelligent Search**: Generates optimized search queries for LinkedIn candidate discovery
+- **Profile Analysis**: Extracts and structures candidate data using advanced parsing
+- **AI Scoring**: Multi-dimensional scoring algorithm evaluating education, experience, skills, and cultural fit
+- **Personalized Outreach**: Generates tailored outreach messages highlighting candidate strengths
+- **RESTful API**: Easy integration with existing HR systems and workflows
+## 📡 API Usage
+### POST `/source-candidates`
+Submit a job description and get ranked candidates with personalized outreach messages.
+**Request:**
+```json
+{
+  "title": "Software Engineer, ML Research",
+  "company": "Windsurf",
+  "location": "Mountain View, CA",
+  "requirements": [
+    "Experience with large language models (LLMs)",
+    "Strong background in machine learning and AI",
+    "PhD or Master's in Computer Science or related field"
+  ],
+  "description": "We are looking for a talented ML Research Engineer...",
+  "max_candidates": 10,
+  "confidence_threshold": 0.3
+}
+```
+**Response:**
+```json
+{
+  "job_id": "abc123",
+  "job_title": "Software Engineer, ML Research",
+  "company": "Windsurf",
+  "candidates_found": 5,
+  "candidates_scored": 5,
+  "top_candidates": [
+    {
+      "name": "John Doe",
+      "linkedin_url": "https://linkedin.com/in/johndoe",
+      "fit_score": 8.5,
+      "confidence": 0.9,
+      "adjusted_score": 7.65,
+      "key_highlights": [
+        "PhD in Computer Science from Stanford",
+        "Current: Senior ML Engineer at Google",
+        "Skills: LLM, PyTorch, TensorFlow"
+      ],
+      "outreach_message": "Hi John, I noticed your impressive work with LLMs at Google and think you'd be perfect for our ML Research role at Windsurf...",
+      "profile_summary": {
+        "name": "John Doe",
+        "headline": "Senior ML Engineer | LLM Specialist",
+        "current_company": "Google",
+        "score_breakdown": {
+          "education": 9.5,
+          "career_trajectory": 8.0,
+          "company_relevance": 9.0,
+          "experience_match": 8.5
+        }
+      }
+    }
+  ],
+  "processing_time": 12.5,
+  "status": "completed",
+  "timestamp": "2025-07-01T02:30:00Z"
+}
+```
+## 🔧 Endpoints
+- `GET /` - API information
+- `GET /health` - Health check
+- `POST /source-candidates` - Main sourcing endpoint
+- `GET /example` - Example request format
+- `GET /docs` - Interactive API documentation
+## 🎯 Scoring Algorithm
+The system evaluates candidates across multiple dimensions:
+- **Education** (25%): University prestige, degree relevance, field of study
+- **Experience Match** (30%): Role similarity, industry relevance, skill alignment
+- **Career Trajectory** (20%): Progression, tenure, company quality
+- **Company Relevance** (15%): Similar company experience, industry fit
+- **Location Match** (10%): Geographic compatibility
+## 🚀 Quick Start
+1. Visit the API documentation at `/docs`
+2. Try the `/example` endpoint to see request format
+3. Submit a job via `/source-candidates`
+4. Get ranked candidates with personalized messages
+## 🔐 Note
+This demo uses mock data for educational purposes. In production, you would need:
+- Valid LinkedIn API access
+- SerpAPI key for search
+- Groq API key for LLM processing
+Built with FastAPI, Pydantic, and modern async Python.

README_spaces.md ADDED Viewed

	@@ -0,0 +1,8 @@

+title: LinkedIn Sourcing Agent API
+emoji: 🎯
+colorFrom: blue
+colorTo: purple
+sdk: docker
+pinned: false
+license: mit
+app_port: 7860

api_main.py ADDED Viewed

	@@ -0,0 +1,255 @@

+#!/usr/bin/env python3
+"""
+FastAPI application for LinkedIn Candidate Sourcing Agent
+Deployable to HuggingFace Spaces
+"""
+from fastapi import FastAPI, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel, Field
+from typing import List, Optional
+import asyncio
+import logging
+from datetime import datetime
+# Import your existing components
+from app.models.schemas import JobProcessingRequest, JobDescription
+from app.services.agent import LinkedInSourcingAgent
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# FastAPI app
+app = FastAPI(
+    title="LinkedIn Sourcing Agent API",
+    description="AI-powered candidate sourcing and scoring system",
+    version="1.0.0",
+    docs_url="/docs",
+    redoc_url="/redoc"
+)
+# Add CORS middleware
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# Initialize the agent
+agent = LinkedInSourcingAgent()
+# API Models
+# Request payload accepted by POST /source-candidates.
+class JobInput(BaseModel):
+    # Required job title and hiring company name.
+    title: str = Field(..., description="Job title", example="Software Engineer, ML Research")
+    company: str = Field(..., description="Company name", example="Windsurf")
+    # Optional; None when the caller omits it.
+    location: Optional[str] = Field(None, description="Job location", example="Mountain View, CA")
+    # Free-form requirement strings; defaults to an empty list.
+    requirements: List[str] = Field(
+        default_factory=list,
+        description="List of job requirements",
+        example=[
+            "Experience with large language models (LLMs)",
+            "Strong background in machine learning and AI",
+            "PhD or Master's in Computer Science or related field"
+        ]
+    )
+    # Optional; source_candidates substitutes a generated one-line
+    # description when this is None or empty.
+    description: Optional[str] = Field(
+        None,
+        description="Detailed job description",
+        example="We are looking for a talented ML Research Engineer to join our team working on cutting-edge AI technologies."
+    )
+    # Validated to the range 1..50; defaults to 10.
+    max_candidates: int = Field(10, ge=1, le=50, description="Maximum number of candidates to find")
+    # Validated to the range 0..1; defaults to 0.3.
+    confidence_threshold: float = Field(0.3, ge=0, le=1, description="Minimum confidence threshold")
+# One candidate as returned to API clients; instances are built by
+# convert_scored_candidate from an internal scored candidate.
+class CandidateOutput(BaseModel):
+    # Copied from the candidate's profile.
+    name: str
+    linkedin_url: str
+    # Copied unchanged from the internal scored candidate.
+    fit_score: float
+    confidence: float
+    adjusted_score: float
+    # Short human-readable strings (education, experience, skills, location).
+    key_highlights: List[str]
+    outreach_message: str
+    # Free-form dict: profile basics, entry counts and a score_breakdown dict.
+    profile_summary: dict
+# Response body of POST /source-candidates; assembled in source_candidates.
+class SourcingResponse(BaseModel):
+    # Taken from the agent's processing result.
+    job_id: str
+    # Echoed back from the request.
+    job_title: str
+    company: str
+    # Taken from the agent's processing result.
+    candidates_found: int
+    # Number of candidates in the agent's result before conversion.
+    candidates_scored: int
+    # Candidates that were successfully converted to the API format.
+    top_candidates: List[CandidateOutput]
+    # Taken from the agent's processing result.
+    processing_time: float
+    status: str
+    # Set with datetime.now() when the response is built.
+    timestamp: datetime
+# Helper function to convert ScoredCandidate to API format
+def convert_scored_candidate(candidate) -> CandidateOutput:
+    """Convert internal ScoredCandidate to API response format"""
+    # Extract key highlights from profile
+    key_highlights = []
+    profile = candidate.profile
+    # Add education highlights
+    if profile.education:
+        for edu in profile.education[:2]:  # Top 2 education entries
+            if edu.institution and edu.degree:
+                key_highlights.append(f"{edu.degree} from {edu.institution}")
+    # Add experience highlights
+    if profile.experience:
+        current_exp = profile.experience[0]
+        key_highlights.append(f"Current: {current_exp.title} at {current_exp.company}")
+        if len(profile.experience) > 1:
+            prev_exp = profile.experience[1]
+            key_highlights.append(f"Previous: {prev_exp.title} at {prev_exp.company}")
+    # Add skills highlight
+    if profile.skills:
+        top_skills = profile.skills[:5]  # Top 5 skills
+        key_highlights.append(f"Skills: {', '.join(top_skills)}")
+    # Add location if available
+    if profile.location:
+        key_highlights.append(f"Location: {profile.location}")
+    # Create profile summary
+    profile_summary = {
+        "name": profile.name,
+        "headline": profile.headline,
+        "current_company": profile.current_company,
+        "current_position": profile.current_position,
+        "location": profile.location,
+        "education_count": len(profile.education),
+        "experience_count": len(profile.experience),
+        "skills_count": len(profile.skills),
+        "score_breakdown": {
+            "education": candidate.score_breakdown.education,
+            "career_trajectory": candidate.score_breakdown.career_trajectory,
+            "company_relevance": candidate.score_breakdown.company_relevance,
+            "experience_match": candidate.score_breakdown.experience_match,
+        }
+    }
+    return CandidateOutput(
+        name=profile.name,
+        linkedin_url=profile.linkedin_url,
+        fit_score=candidate.fit_score,
+        confidence=candidate.confidence,
+        adjusted_score=candidate.adjusted_score,
+        key_highlights=key_highlights,
+        outreach_message=candidate.outreach_message,
+        profile_summary=profile_summary
+    )
+@app.get("/")
+async def root():
+    """Health check endpoint"""
+    return {
+        "message": "LinkedIn Sourcing Agent API",
+        "status": "active",
+        "version": "1.0.0",
+        "docs": "/docs"
+    }
+@app.get("/health")
+async def health_check():
+    """Detailed health check"""
+    return {
+        "status": "healthy",
+        "timestamp": datetime.now().isoformat(),
+        "service": "linkedin-sourcing-agent"
+    }
+@app.post("/source-candidates", response_model=SourcingResponse)
+async def source_candidates(job_input: JobInput):
+    """
+    Source and score candidates for a given job description
+    This endpoint:
+    1. Searches for LinkedIn candidates based on job requirements
+    2. Extracts and analyzes candidate profiles
+    3. Scores candidates using AI-powered algorithms
+    4. Generates personalized outreach messages
+    5. Returns top candidates ranked by fit score
+    """
+    try:
+        logger.info(f"Processing job request: {job_input.title} at {job_input.company}")
+        # Convert API input to internal format
+        job_desc = JobDescription(
+            title=job_input.title,
+            company=job_input.company,
+            location=job_input.location,
+            requirements=job_input.requirements,
+            description=job_input.description or f"Join {job_input.company} as a {job_input.title}"
+        )
+        # Create processing request
+        request = JobProcessingRequest(
+            job_description=job_desc,
+            max_candidates=job_input.max_candidates,
+            confidence_threshold=job_input.confidence_threshold
+        )
+        # Process the job
+        result = await agent.process_job(request)
+        # Convert candidates to API format
+        api_candidates = []
+        for candidate in result.candidates[:10]:  # Top 10 candidates
+            try:
+                api_candidate = convert_scored_candidate(candidate)
+                api_candidates.append(api_candidate)
+            except Exception as e:
+                logger.warning(f"Failed to convert candidate: {e}")
+                continue
+        response = SourcingResponse(
+            job_id=result.job_id,
+            job_title=job_input.title,
+            company=job_input.company,
+            candidates_found=result.candidates_found,
+            candidates_scored=len(result.candidates),
+            top_candidates=api_candidates,
+            processing_time=result.processing_time,
+            status=result.status,
+            timestamp=datetime.now()
+        )
+        logger.info(f"Successfully processed job. Found {len(api_candidates)} candidates")
+        return response
+    except Exception as e:
+        logger.error(f"Error processing job request: {str(e)}")
+        raise HTTPException(
+            status_code=500,
+            detail=f"Failed to process job request: {str(e)}"
+        )
+@app.get("/example")
+async def get_example():
+    """Get an example job input for testing"""
+    return {
+        "example_input": {
+            "title": "Software Engineer, ML Research",
+            "company": "Windsurf",
+            "location": "Mountain View, CA",
+            "requirements": [
+                "Experience with large language models (LLMs)",
+                "Strong background in machine learning and AI",
+                "PhD or Master's in Computer Science or related field",
+                "Experience with search and ranking systems",
+                "Python and deep learning frameworks"
+            ],
+            "description": "We are looking for a talented ML Research Engineer to join our team working on cutting-edge AI technologies. You will be responsible for developing and improving large language models, search algorithms, and AI-powered features.",
+            "max_candidates": 5,
+            "confidence_threshold": 0.3
+        }
+    }
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=7860)  # Port 7860 is standard for HuggingFace Spaces

demo_api.py ADDED Viewed

	@@ -0,0 +1,113 @@

+#!/usr/bin/env python3
+"""
+Demo script to test the LinkedIn Sourcing Agent API
+"""
+import requests
+import json
+import time
+# API base URL (adjust for your deployment)
+# Every request made by test_api() is issued against this root. To target a
+# deployed Space, comment out the local value and enable the line below it.
+BASE_URL = "http://localhost:7860"  # Local testing
+# BASE_URL = "https://your-huggingface-space.hf.space"  # HuggingFace deployment
+def test_api():
+    """Test the API with a sample job"""
+    print("🎯 LinkedIn Sourcing Agent API Demo")
+    print("=" * 50)
+    # Test health check
+    print("1. Health Check...")
+    try:
+        response = requests.get(f"{BASE_URL}/health")
+        if response.status_code == 200:
+            print("✅ API is healthy")
+        else:
+            print("❌ API health check failed")
+            return
+    except Exception as e:
+        print(f"❌ Cannot connect to API: {e}")
+        return
+    # Get example request format
+    print("\n2. Getting example format...")
+    try:
+        response = requests.get(f"{BASE_URL}/example")
+        example = response.json()
+        print("✅ Example format retrieved")
+    except Exception as e:
+        print(f"❌ Failed to get example: {e}")
+        return
+    # Test job sourcing
+    print("\n3. Testing candidate sourcing...")
+    job_data = {
+        "title": "Software Engineer, ML Research",
+        "company": "Windsurf",
+        "location": "Mountain View, CA",
+        "requirements": [
+            "Experience with large language models (LLMs)",
+            "Strong background in machine learning and AI",
+            "PhD or Master's in Computer Science or related field",
+            "Experience with search and ranking systems",
+            "Python and deep learning frameworks"
+        ],
+        "description": "We are looking for a talented ML Research Engineer to join our team working on cutting-edge AI technologies. You will be responsible for developing and improving large language models, search algorithms, and AI-powered features.",
+        "max_candidates": 5,
+        "confidence_threshold": 0.3
+    }
+    print(f"📋 Job: {job_data['title']} at {job_data['company']}")
+    print("🔍 Searching for candidates...")
+    start_time = time.time()
+    try:
+        response = requests.post(
+            f"{BASE_URL}/source-candidates",
+            json=job_data,
+            timeout=60  # 60 second timeout
+        )
+        if response.status_code == 200:
+            result = response.json()
+            processing_time = time.time() - start_time
+            print(f"✅ Search completed in {processing_time:.1f}s")
+            print(f"📊 Results:")
+            print(f"   Job ID: {result['job_id']}")
+            print(f"   Candidates Found: {result['candidates_found']}")
+            print(f"   Candidates Scored: {result['candidates_scored']}")
+            print(f"   Top Candidates: {len(result['top_candidates'])}")
+            print(f"   Status: {result['status']}")
+            # Show top candidates
+            print(f"\n🎯 Top Candidates:")
+            for i, candidate in enumerate(result['top_candidates'][:3], 1):
+                print(f"\n   {i}. {candidate['name']}")
+                print(f"      Fit Score: {candidate['fit_score']}/10")
+                print(f"      Confidence: {candidate['confidence']}")
+                print(f"      Adjusted Score: {candidate['adjusted_score']}")
+                print(f"      Company: {candidate['profile_summary']['current_company']}")
+                print(f"      LinkedIn: {candidate['linkedin_url']}")
+                print(f"      Key Highlights:")
+                for highlight in candidate['key_highlights'][:3]:
+                    print(f"        • {highlight}")
+                print(f"      Outreach: {candidate['outreach_message'][:100]}...")
+            # Save full results
+            with open('demo_results.json', 'w') as f:
+                json.dump(result, f, indent=2, default=str)
+            print(f"\n💾 Full results saved to demo_results.json")
+        else:
+            print(f"❌ API request failed: {response.status_code}")
+            print(f"   Error: {response.text}")
+    except requests.exceptions.Timeout:
+        print("⏰ Request timeout - this is normal for complex searches")
+    except Exception as e:
+        print(f"❌ Request failed: {e}")
+# Run the demo only when executed as a script, not when imported.
+if __name__ == "__main__":
+    test_api()