Spaces:

yoursdvniel
/

SmartInc-API

Sleeping

App Files Community

yoursdvniel committed on Apr 29

Commit

9fed675

verified ·

1 Parent(s): 9ed036f

Reset to old endpoints

Browse files

Files changed (1) hide show

main.py +0 -226

main.py CHANGED Viewed

@@ -520,160 +520,6 @@ def _normalize_outline_json(ai_result: Dict[str, Any]) -> Dict[str, Any]:
         ],
     }
-ALLOWED_INTAKE_EXTENSIONS = {"pdf", "docx", "txt"}
-MAX_INTAKE_DOC_CHARS = 25000
-def _allowed_intake_source(filename: str) -> bool:
-    return bool(filename and "." in filename and filename.rsplit(".", 1)[1].lower() in ALLOWED_INTAKE_EXTENSIONS)
-def _extract_text_from_txt_bytes(file_bytes: bytes) -> str:
-    return _clean_extracted_text(file_bytes.decode("utf-8", errors="ignore"))
-def _extract_intake_document_text(filename: str, file_bytes: bytes) -> str:
-    ext = filename.rsplit(".", 1)[1].lower()
-    if ext == "pdf":
-        return _extract_text_from_pdf_bytes(file_bytes)
-    if ext == "docx":
-        return _extract_text_from_docx_bytes(file_bytes)
-    if ext == "txt":
-        return _extract_text_from_txt_bytes(file_bytes)
-    raise ValueError("Unsupported file type")
-def _build_sme_intake_prompt(payload: Dict[str, Any]) -> str:
-    return f"""
-You are helping an SME complete an incubation application.
-The user may write in English, Shona, Ndebele, Zulu, or a mixture.
-Understand the mixed language, but return clean STRICT JSON only.
-Return this exact JSON shape:
-{{
-  "detectedLanguages": ["English"],
-  "profilePatch": {{
-    "participantName": null,
-    "gender": null,
-    "idNumber": null,
-    "phone": null,
-    "beneficiaryName": null,
-    "sector": null,
-    "natureOfBusiness": null,
-    "beeLevel": null,
-    "youthOwnedPercent": null,
-    "femaleOwnedPercent": null,
-    "blackOwnedPercent": null,
-    "dateOfRegistration": null,
-    "yearsOfTrading": null,
-    "registrationNumber": null,
-    "businessAddress": null,
-    "city": null,
-    "postalCode": null,
-    "province": null,
-    "hub": null,
-    "location": null
-  }},
-    "smeAssessment": {{
-    "urgencyLevel": "low|medium|high|urgent",
-    "urgencyScore": 0,
-    "businessStage": "idea|startup|early_growth|established|stagnant|struggling|distressed|growth_ready|unknown",
-    "riskLevel": "low|medium|high",
-    "priorityInterventionAreas": [
-      {
-        "area": "Financial Compliance|HSE & Labour Compliance|Legal Advisory Services|Market Linkages|PDS|Wellness Services|Training Academy|Marketing and Communication|ROM",
-        "urgency": "low|medium|high|urgent",
-        "reason": "",
-        "suggestedInterventions": []
-      }
-    ],
-    "classificationReasons": [],
-    "redFlags": [],
-    "growthSignals": []
-  }},
-  "applicationPatch": {{
-    "motivation": null,
-    "challenges": null,
-    "facebook": null,
-    "instagram": null,
-    "linkedIn": null,
-    "profile": {{}}
-  }},
-  "businessStory": {{
-    "summary": "",
-    "polished": "",
-    "strengths": [],
-    "risks": []
-  }},
-  "documentFindings": [
-    {{
-      "documentType": "Certified ID Copy|Proof of Address|B-BBEE Certificate|Tax PIN|CIPC|Management Accounts|Three Months Bank Statements|Unknown",
-      "filename": "",
-      "extractedFields": {{}},
-      "confidence": 0,
-      "warnings": []
-    }}
-  ],
-  "missingFields": [
-    {{
-      "field": "",
-      "section": "profile|application|program",
-      "label": "",
-      "question": "",
-      "reason": ""
-    }}
-  ],
-  "missingDocuments": [
-    {{
-      "type": "",
-      "reason": ""
-    }}
-  ],
-  "nextQuestion": "",
-  "confidence": 0,
-  "warnings": []
-}}
-Rules:
-- Do not invent values.
-- Use documents for official values like ID number, registration number, business name, registration date, address, B-BBEE level, tax details.
-- If a document contradicts typed text, keep the document value and add a warning.
-- Only return fields that are reasonably supported.
-- For programQuestions, fill applicationPatch.profile using the question id as the key.
-- Ask one best next question in nextQuestion.
-- If nothing important is missing, nextQuestion must be empty.
-- Use South African SMME/incubation context.
-SME assessment rules:
-- urgencyScore must be 0 to 100.
-- urgent = 80-100, high = 60-79, medium = 35-59, low = 0-34.
-- Classify businessStage using the available facts:
-  - idea/startup: newly registered, little or no trading/revenue, business still forming.
-  - early_growth: trading with some traction but systems/compliance/markets still weak.
-  - established: trading for several years with stable operations.
-  - stagnant: revenue, staff, market access, or growth has not improved for a long period.
-  - struggling: serious operational, compliance, cash flow, market, staffing, or documentation gaps.
-  - distressed: severe survival risk, legal/financial/compliance crisis, or inability to trade normally.
-  - growth_ready: stable/compliant business needing market access, finance, procurement, branding, or scale support.
-  - unknown: not enough evidence.
-- Rate urgency higher when there are signs of missing compliance documents, no CIPC/tax/B-BBEE, no bank statements, weak financial records, no contracts, labour/HSE exposure, stagnant revenue, low market access, legal risks, poor business planning, or severe founder/business challenges.
-- Priority intervention areas must align with Lepharo departments:
-  ROM, HSE & Labour Compliance, Financial Compliance, PDS, Market Linkages, Legal Advisory Services, Wellness Services, Training Academy, Marketing and Communication.
-- classificationReasons must explain why the stage and urgency were selected.
-- redFlags must list serious risks.
-- growthSignals must list positive signs.
-- suggestedInterventions must be practical intervention titles, not vague advice.
-Payload:
-{json.dumps(payload, ensure_ascii=False)}
-""".strip()
 # -- route ---------------------------------------------------------------
 @app.route('/chat', methods=['POST'])
@@ -1121,78 +967,6 @@ def generate_course_outline():
             "error": "Failed to generate course outline from file"
         }), 500
-@app.route('/analyze-sme-application-intake', methods=['POST'])
-def analyze_sme_application_intake():
-    try:
-        role = request.form.get("role")
-        company_code = request.form.get("companyCode")
-        user_id = request.form.get("userId")
-        program_id = request.form.get("programId")
-        program_name = request.form.get("programName")
-        raw_story = request.form.get("rawStory") or ""
-        profile_values = json.loads(request.form.get("profileValuesJson") or "{}")
-        application_values = json.loads(request.form.get("applicationValuesJson") or "{}")
-        program_questions = json.loads(request.form.get("programQuestionsJson") or "[]")
-        required_documents = json.loads(request.form.get("requiredDocumentsJson") or "[]")
-        if not role or not company_code or not user_id:
-            return jsonify({"error": "Missing role, companyCode, or userId"}), 400
-        uploaded_files = request.files.getlist("files")
-        document_payloads = []
-        for uploaded in uploaded_files:
-            filename = uploaded.filename or ""
-            if not _allowed_intake_source(filename):
-                document_payloads.append({
-                    "filename": filename,
-                    "text": "",
-                    "warning": "Unsupported file type"
-                })
-                continue
-            file_bytes = uploaded.read()
-            extracted = _extract_intake_document_text(filename, file_bytes)
-            document_payloads.append({
-                "filename": filename,
-                "contentType": uploaded.content_type,
-                "text": _truncate_source_text(extracted, MAX_INTAKE_DOC_CHARS)
-            })
-        payload = {
-            "role": role,
-            "companyCode": company_code,
-            "userId": user_id,
-            "programId": program_id,
-            "programName": program_name,
-            "rawStory": raw_story,
-            "currentProfileValues": profile_values,
-            "currentApplicationValues": application_values,
-            "programQuestions": program_questions,
-            "requiredDocuments": required_documents,
-            "documents": document_payloads
-        }
-        system_msg = {
-            "role": "system",
-            "content": "You extract SME application data. Return strict JSON only."
-        }
-        user_msg = {
-            "role": "user",
-            "content": _build_sme_intake_prompt(payload)
-        }
-        ai_raw = ask_gpt([system_msg, user_msg])
-        parsed = _extract_json_block(ai_raw)
-        return jsonify(to_jsonable(parsed))
-    except Exception as e:
-        print("analyze_sme_application_intake_failed:", e)
-        return jsonify({"error": "Failed to analyse SME application intake"}), 500
 if __name__ == "__main__":
     app.run(host="0.0.0.0", port=7860)

         ],
     }
 # -- route ---------------------------------------------------------------
 @app.route('/chat', methods=['POST'])
             "error": "Failed to generate course outline from file"
         }), 500
 if __name__ == "__main__":
     app.run(host="0.0.0.0", port=7860)