Spaces:

Jaimodiji
/

Report-Generator

Running

App Files Community

Ubuntu committed 8 days ago

Commit

0d6e94b

1 Parent(s): f1ed485

Added changes to fix nemotron parse

Browse files

Files changed (6) hide show

config.py +1 -1
gemini_classification_prompt.txt +2 -6
gemini_classifier.py +3 -0
gemma_classifier.py +82 -40
processing.py +1 -1
redact.py +1 -1

config.py CHANGED Viewed

@@ -7,7 +7,7 @@ class Config:
     OUTPUT_FOLDER = 'output'
     DATABASE = 'database.db'
     NVIDIA_API_KEY = os.getenv("NVIDIA_API_KEY")
-    NIM_API_URL = "https://ai.api.nvidia.com/v1/cv/nvidia/nemoretriever-ocr-v1"
     NIM_HEADERS = {
         "Authorization": f"Bearer {NVIDIA_API_KEY}",
         "Accept": "application/json",

     OUTPUT_FOLDER = 'output'
     DATABASE = 'database.db'
     NVIDIA_API_KEY = os.getenv("NVIDIA_API_KEY")
+    NIM_API_URL = "https://ai.api.nvidia.com/v1/cv/nvidia/nemotron-ocr-v1"
     NIM_HEADERS = {
         "Authorization": f"Bearer {NVIDIA_API_KEY}",
         "Accept": "application/json",

gemini_classification_prompt.txt CHANGED Viewed

@@ -199,10 +199,6 @@ Your task is to analyze each question, first classify it into the most relevant
 Now classify the following question(s):
 ```
-8. first-order reaction has half-life 200 s. Time required for the amount of reactant to become one- eighth of its initial value is: (A) 200 s (B) 400 s (C) 600 s (D) 800 s
-9. Which hormone helps in internode/petiole elongation in deep water rice plants to keep leaves/ upper parts of the shoot above water? (A) Gibberellins (B) Zeatin (C) ABA (D) Ethylene
-10. Given below are two statements: The interphase nucleus has highly extended and elaborate nucleoprotein fibres called chromatin which contains DNA and some basic proteins called histones, some non-histone proteins and also RNA. Statement I: Statement II: A haploid set of chromosomes in humans contains 3.3 X 109 bp which is approximately two metre long thread of DNA distributed among its twenty three chromosomes. In the light of the above statements, choose the most appropriate answer from the options given below: (A) Statement is correct but Statement Il is incorrect. (B) Statement is incorrect but Statement ll is correct. (C) Both Statement and Statement ll are correct. (D) Both Statement and Statement ll are incorrect.
-11. A force F = - (yi + +x)) N acts on a particle moving in the xy plane. Starting from the origin, the particle is taken along the positive x-axis to the point (a, 0) m and then parallel to the y-axis to the point (a, a) m. The total work done (in joules) by the force is: (A) ka² (B) ka² (C) -2ka² (D) Zero
-12. On electrolysis of dilute nitric acid using platinum electrodes, the product obtained at the anode is: (A) H2 gas (B) O2 gas (C) NO2 gas (D) N2 gas
-13. Identify the incorrectly matched pair: (A) Petiole is modified for photosynthesis Australian acacia (B) Leaves modified into spines Cactus (C) Stem modified into a fleshy, cylindrical photosynthetic structure Opuntia (D) Stem modified into thorns Citrus
 ```

 Now classify the following question(s):
 ```
+1. 1. A parallel plate capacitor is charged by connecting it to a battery through a resistor. If I is the current in the circuit, then in the gap between the plates 1) There is no current 2) Displacement current of magnitude greater than flows but it can be any direction 3) Displacement current of magnitude equal to flows in a direction opposite to that of I. 4) Displacement current of magnitude equal to flows in the same direction as I. 2. For the following diagram [used to measure the length of a small metal piece by using vernier callipers], determine the length of the metal piece. Least count of the vernier callipers is 0.1 mm 10 15 20 mm Vernier scale Object 1) 18 mm 2) 15.7 mm 3) 12.6 mm 4) 10.2 mm
+2. 3. Statement I: The speed of whirlwind in a tornado is alarmingly high. Statement II: If no external torque acts on a body, its angular velocity remains conserved 1) Statement I is true, Statement II is true; Statement II is not the correct explanation of Statement I 2) Statement I is true, Statement II is false 3) Statement I is false, Statement II is true 4) Statement I is true, Statement II is true; Statement II is the correct explanation of Statement I
 ```

gemini_classifier.py CHANGED Viewed

@@ -229,7 +229,10 @@ Now classify the following question(s):
     with open('gemini_classification_prompt.txt', 'w') as f:
         f.write(prompt)
     url = f"https://generativelanguage.googleapis.com/v1beta/models/gemini-2.5-flash:generateContent?key={api_key}"
     headers = {'Content-Type': 'application/json'}
     request_body = {

     with open('gemini_classification_prompt.txt', 'w') as f:
         f.write(prompt)
+    # gemma-4-26b-a4b-it
     url = f"https://generativelanguage.googleapis.com/v1beta/models/gemini-2.5-flash:generateContent?key={api_key}"
     headers = {'Content-Type': 'application/json'}
     request_body = {

gemma_classifier.py CHANGED Viewed

@@ -1,92 +1,134 @@
-import os
 import json
 import requests
 import sys
 from typing import List, Dict, Any, Optional
 from api_key_manager import get_api_key_manager
 class GemmaClassifier:
     def __init__(self):
         # API key will be fetched dynamically via get_api_key_manager
         pass
     def classify(self, questions: List[str], start_index: int = 0) -> Optional[Dict[str, Any]]:
         """
-        Classifies a list of questions using the NVIDIA NIM Gemma API.
         `questions` should be a list of strings representing the questions to classify.
         `start_index` is the overall starting index for this batch (e.g., 0, 7, 14...).
         """
         manager = get_api_key_manager()
-        api_key, key_index = manager.get_key('nvidia')
         if not api_key:
-            raise ValueError("No available NVIDIA API keys. Please set NVIDIA_API_KEY environment variable.")
         full_prompt = self._generate_gemma_prompt(questions=questions, start_index=start_index)
-        url = "https://integrate.api.nvidia.com/v1/chat/completions"
         headers = {
-            "Authorization": f"Bearer {api_key}",
             "Content-Type": "application/json"
         }
         payload = {
-            "model": "google/gemma-3n-e4b-it",
-            "messages": [{"role": "user", "content": full_prompt}],
-            "temperature": 0.2,
-            "max_tokens": 2048,
-            "stream": False
         }
-        print(f"Sending batch to NVIDIA NIM Gemma API with {len(questions)} questions.")
         try:
             response = requests.post(url, headers=headers, json=payload, timeout=300)
             response.raise_for_status()
             response_json = response.json()
-            if 'choices' in response_json and len(response_json['choices']) > 0:
-                first_choice = response_json['choices'][0]
-                if 'message' in first_choice and 'content' in first_choice['message']:
-                    model_output_content = first_choice['message']['content']
-                    if model_output_content.startswith("```json") and model_output_content.endswith("```"):
-                        model_output_content = model_output_content[7:-3].strip()
-                    try:
-                        batch_result = json.loads(model_output_content)
-                        manager.mark_success('nvidia', key_index)
-                        return batch_result
-                    except json.JSONDecodeError as e:
-                        print(f"Error decoding JSON from model output: {e}", file=sys.stderr)
-                        print(f"Model output content: {model_output_content}", file=sys.stderr)
-                        manager.mark_failure('nvidia', key_index)
-                        return None
-                else:
-                    print("Error: 'message' or 'content' not found in NVIDIA NIM Gemma response choice.", file=sys.stderr)
-                    manager.mark_failure('nvidia', key_index)
-                    return None
-            else:
-                print("Error: 'choices' not found or empty in NVIDIA NIM Gemma response.", file=sys.stderr)
-                manager.mark_failure('nvidia', key_index)
                 return None
         except requests.exceptions.RequestException as e:
-            print(f"Error during NVIDIA NIM Gemma API call: {repr(e)}", file=sys.stderr)
             if e.response is not None:
                 print(f"Response status code: {e.response.status_code}", file=sys.stderr)
                 print(f"Response body: {e.response.text}", file=sys.stderr)
-            manager.mark_failure('nvidia', key_index)
             return None
         except Exception as e:
             print(f"An unexpected error occurred: {e}", file=sys.stderr)
-            manager.mark_failure('nvidia', key_index)
             return None
     def _generate_gemma_prompt(self, questions: List[str], start_index: int) -> str:
         """
-        Generates the detailed prompt for the Gemma classifier, similar to gemini_classifier.py.
         """
         input_text = "\n".join([f"{j + start_index + 1}. {q}" for j, q in enumerate(questions)])

 import json
 import requests
 import sys
 from typing import List, Dict, Any, Optional
 from api_key_manager import get_api_key_manager
 class GemmaClassifier:
+    MODEL_ID = "gemma-4-26b-a4b-it"
+    API_BASE = "https://generativelanguage.googleapis.com/v1beta/models"
     def __init__(self):
         # API key will be fetched dynamically via get_api_key_manager
         pass
     def classify(self, questions: List[str], start_index: int = 0) -> Optional[Dict[str, Any]]:
         """
+        Classifies a list of questions using the Gemini API (Gemma 4 model).
         `questions` should be a list of strings representing the questions to classify.
         `start_index` is the overall starting index for this batch (e.g., 0, 7, 14...).
         """
         manager = get_api_key_manager()
+        api_key, key_index = manager.get_key('gemini')
         if not api_key:
+            raise ValueError("No available Gemini API keys. Please set GEMINI_API_KEY environment variable.")
         full_prompt = self._generate_gemma_prompt(questions=questions, start_index=start_index)
+        url = f"{self.API_BASE}/{self.MODEL_ID}:streamGenerateContent?key={api_key}"
         headers = {
             "Content-Type": "application/json"
         }
         payload = {
+            "contents": [
+                {
+                    "role": "user",
+                    "parts": [
+                        {"text": full_prompt}
+                    ]
+                }
+            ],
+            "generationConfig": {
+                "thinkingConfig": {
+                    "thinkingLevel": "HIGH"
+                }
+            },
+            "tools": [
+                {
+                    "googleSearch": {}
+                }
+            ]
         }
+        print(f"Sending batch to Gemini API (Gemma 4) with {len(questions)} questions.")
         try:
             response = requests.post(url, headers=headers, json=payload, timeout=300)
             response.raise_for_status()
+            # streamGenerateContent returns a JSON array of chunks
             response_json = response.json()
+            # Accumulate all text parts across all chunks
+            model_output_content = self._extract_streamed_text(response_json)
+            if model_output_content is None:
+                print("Error: No text content found in Gemini API response.", file=sys.stderr)
+                manager.mark_failure('gemini', key_index)
+                return None
+            # Strip optional ```json ... ``` fences
+            cleaned = model_output_content.strip()
+            if cleaned.startswith("```json") and cleaned.endswith("```"):
+                cleaned = cleaned[7:-3].strip()
+            elif cleaned.startswith("```") and cleaned.endswith("```"):
+                cleaned = cleaned[3:-3].strip()
+            try:
+                batch_result = json.loads(cleaned)
+                manager.mark_success('gemini', key_index)
+                return batch_result
+            except json.JSONDecodeError as e:
+                print(f"Error decoding JSON from model output: {e}", file=sys.stderr)
+                print(f"Model output content: {model_output_content}", file=sys.stderr)
+                manager.mark_failure('gemini', key_index)
                 return None
         except requests.exceptions.RequestException as e:
+            print(f"Error during Gemini API call: {repr(e)}", file=sys.stderr)
             if e.response is not None:
                 print(f"Response status code: {e.response.status_code}", file=sys.stderr)
                 print(f"Response body: {e.response.text}", file=sys.stderr)
+            manager.mark_failure('gemini', key_index)
             return None
         except Exception as e:
             print(f"An unexpected error occurred: {e}", file=sys.stderr)
+            manager.mark_failure('gemini', key_index)
             return None
+    # ------------------------------------------------------------------
+    # Private helpers
+    # ------------------------------------------------------------------
+    def _extract_streamed_text(self, response_json) -> Optional[str]:
+        """
+        Gemini's streamGenerateContent returns a JSON array of candidate chunks.
+        Each chunk looks like:
+          {"candidates": [{"content": {"parts": [{"text": "..."}]}}]}
+        This method concatenates all text parts across all chunks.
+        """
+        parts_text = []
+        # response_json may be a list of chunks or a single dict
+        chunks = response_json if isinstance(response_json, list) else [response_json]
+        for chunk in chunks:
+            candidates = chunk.get("candidates", [])
+            for candidate in candidates:
+                content = candidate.get("content", {})
+                for part in content.get("parts", []):
+                    text = part.get("text")
+                    if text:
+                        parts_text.append(text)
+        return "".join(parts_text) if parts_text else None
     def _generate_gemma_prompt(self, questions: List[str], start_index: int) -> str:
         """
+        Generates the detailed prompt for the Gemma classifier.
         """
         input_text = "\n".join([f"{j + start_index + 1}. {q}" for j, q in enumerate(questions)])

processing.py CHANGED Viewed

@@ -12,7 +12,7 @@ from flask import current_app
 from api_key_manager import get_api_key_manager
 # --- NVIDIA NIM Configuration ---
-NIM_API_URL = "https://ai.api.nvidia.com/v1/cv/nvidia/nemoretriever-ocr-v1"
 def resize_image_if_needed(image_path: str) -> bytes:
     """Resizes an image to a maximum of 500x500 pixels and returns bytes."""

 from api_key_manager import get_api_key_manager
 # --- NVIDIA NIM Configuration ---
+NIM_API_URL = "https://ai.api.nvidia.com/v1/cv/nvidia/nemotron-ocr-v1"
 def resize_image_if_needed(image_path: str) -> bytes:
     """Resizes an image to a maximum of 500x500 pixels and returns bytes."""

redact.py CHANGED Viewed

@@ -10,7 +10,7 @@ import json
 # --- Configuration ---
 # API endpoints should remain constant
-INVOKE_URL_OCR = "https://ai.api.nvidia.com/v1/cv/nvidia/nemoretriever-ocr-v1"
 INVOKE_URL_PARSER = "https://integrate.api.nvidia.com/v1/chat/completions"
 # Define a max pixel count for the parser model to avoid sending overly large images.

 # --- Configuration ---
 # API endpoints should remain constant
+INVOKE_URL_OCR = "https://ai.api.nvidia.com/v1/cv/nvidia/nemotron-ocr-v1"
 INVOKE_URL_PARSER = "https://integrate.api.nvidia.com/v1/chat/completions"
 # Define a max pixel count for the parser model to avoid sending overly large images.