Spaces:

Borislav18
/

Shedify

Runtime error

App Files Files Community

Borislav18 committed on Mar 27

Commit

c3dfa5f

1 Parent(s): 6ccc1d7

Update space

Browse files

Files changed (2) hide show

app.py +249 -21
requirements.txt +11 -1

app.py CHANGED Viewed

@@ -1,11 +1,88 @@
 import gradio as gr
-from huggingface_hub import InferenceClient
 """
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 def respond(
     message,
@@ -17,6 +94,7 @@ def respond(
 ):
     messages = [{"role": "system", "content": system_message}]
     for val in history:
         if val[0]:
             messages.append({"role": "user", "content": val[0]})
@@ -27,6 +105,7 @@ def respond(
     response = ""
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
@@ -39,26 +118,175 @@ def respond(
         response += token
         yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
-demo = gr.ChatInterface(
-    respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)",
-        ),
-    ],
-)
 if __name__ == "__main__":
     demo.launch()

 import gradio as gr
+import os
+import json
+import time
+import subprocess
+import threading
+import uuid
+from pathlib import Path
+from huggingface_hub import InferenceClient, HfFolder
 """
+Shedify app - Using fine-tuned Llama 3.3 49B for document assistance
 """
# --- Model configuration -------------------------------------------------
# Hub repository (username/model name) queried by the chat interface.
DEFAULT_MODEL = "Borislav18/Shedify"
# Optional override read from the environment for local testing.
LOCAL_MODEL = os.getenv("LOCAL_MODEL")

# Hugging Face access token, read from the environment (None when unset).
HF_TOKEN = os.getenv("HF_TOKEN")

# --- UI text -------------------------------------------------------------
title = "Shedify - Document Assistant powered by Llama 3.3"
description = """
This app uses a fine-tuned version of Llama 3.3 49B model trained on your documents.
Ask questions about the documents, generate insights, or request summaries!
"""

# Inference client bound to the default model; used by the chat handler.
client = InferenceClient(model=DEFAULT_MODEL, token=HF_TOKEN)
+# Training status tracking
class TrainingState:
    """Track the fine-tuning status and persist it to a small JSON file.

    Attributes:
        status: One of "idle", "running", "success" or "failed".
        progress: Completion fraction between 0.0 and 1.0.
        message: Human-readable description of the current step.
        id: Short identifier; restored from the state file when one exists.
        state_file: Path of the JSON file the state is persisted to.
    """

    def __init__(self, state_file="training_state.json"):
        """Create the state, restoring any previously persisted values.

        Args:
            state_file: Location of the JSON state file. Defaults to
                ``training_state.json`` in the current working directory.
        """
        self.status = "idle"  # idle, running, success, failed
        self.progress = 0.0   # 0.0 to 1.0
        self.message = ""
        self.id = str(uuid.uuid4())[:8]  # Short unique ID for this session
        self.state_file = Path(state_file)
        self.load_state()
        # A persisted "running" status can only come from an earlier process:
        # the worker thread does not survive a restart, so leaving the status
        # as "running" would block every future training request.
        if self.status == "running":
            self.update(
                status="failed",
                progress=0.0,
                message="Previous training run was interrupted before it finished.",
            )

    def load_state(self):
        """Load state from the state file if it exists and is readable.

        Unreadable or malformed files are reported on stdout and otherwise
        ignored, leaving the current in-memory values untouched.
        """
        try:
            with open(self.state_file, "r", encoding="utf-8") as f:
                state = json.load(f)
        except FileNotFoundError:
            return
        except (OSError, ValueError) as e:
            # ValueError covers json.JSONDecodeError and decoding errors.
            print(f"Error loading state: {e}")
            return

        if not isinstance(state, dict):
            print(
                "Error loading state: expected a JSON object, "
                f"got {type(state).__name__}"
            )
            return

        self.status = state.get("status", "idle")
        self.progress = state.get("progress", 0.0)
        self.message = state.get("message", "")
        self.id = state.get("id", self.id)

    def save_state(self):
        """Persist the current state to the state file.

        The data is written to a sibling temporary file and then renamed over
        the target so that a reader never observes a half-written file.
        Failures are reported on stdout and do not raise.
        """
        payload = {
            "status": self.status,
            "progress": self.progress,
            "message": self.message,
            "id": self.id,
        }
        tmp_file = self.state_file.with_name(self.state_file.name + ".tmp")
        try:
            with open(tmp_file, "w", encoding="utf-8") as f:
                json.dump(payload, f)
            tmp_file.replace(self.state_file)
        except (OSError, TypeError, ValueError) as e:
            print(f"Error saving state: {e}")

    def update(self, status=None, progress=None, message=None):
        """Update the given fields, persist the state, and return it.

        Args:
            status: New status, or None to keep the current one.
            progress: New progress fraction, or None to keep the current one.
            message: New message, or None to keep the current one.

        Returns:
            The tuple ``(status, progress, message)`` after the update.
        """
        if status is not None:
            self.status = status
        if progress is not None:
            self.progress = progress
        if message is not None:
            self.message = message
        self.save_state()
        return self.status, self.progress, self.message
+# Initialize the training state
+training_state = TrainingState()
 def respond(
     message,
 ):
     messages = [{"role": "system", "content": system_message}]
+    # Format history to match chat completion format
     for val in history:
         if val[0]:
             messages.append({"role": "user", "content": val[0]})
     response = ""
+    # Use streaming to get real-time responses
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
         response += token
         yield response
def _stderr_tail(stderr, limit=2000):
    """Return at most the last *limit* characters of a subprocess's stderr."""
    return (stderr or "").strip()[-limit:]


def run_training_process(pdf_dir, output_name, progress_callback):
    """Run the PDF processing and fine-tuning scripts, reporting progress.

    Args:
        pdf_dir: Directory containing the PDFs to process.
        output_name: Model name; the result is pushed to
            ``Borislav18/<output_name>``.
        progress_callback: Callable invoked as
            ``progress_callback(status, progress, message)`` at each step.

    Returns:
        True when both steps succeed, False otherwise. Failures are reported
        through ``progress_callback`` rather than raised.
    """
    import sys  # local import: only needed to locate the running interpreter

    try:
        # Validate cheap preconditions first so that obvious mistakes fail
        # before any long-running work is started.
        if not os.path.isdir(pdf_dir):
            progress_callback("failed", 0.0, f"PDF directory not found: {pdf_dir}")
            return False

        hf_token = HF_TOKEN or HfFolder.get_token()
        if not hf_token:
            progress_callback(
                "failed",
                0.0,
                "No Hugging Face token found. Please set the HF_TOKEN environment variable.",
            )
            return False

        # Create processed_data directory if it doesn't exist
        os.makedirs("processed_data", exist_ok=True)

        progress_callback("running", 0.05, "Processing PDFs...")

        # Use the interpreter running this app so the child process sees the
        # same installed packages; a bare "python" may resolve elsewhere.
        pdf_process = subprocess.run(
            [
                sys.executable, "pdf_processor.py",
                "--pdf_dir", pdf_dir,
                "--output_dir", "processed_data",
            ],
            capture_output=True,
            text=True,
        )
        if pdf_process.returncode != 0:
            progress_callback(
                "failed",
                0.0,
                f"PDF processing failed: {_stderr_tail(pdf_process.stderr)}",
            )
            return False

        progress_callback("running", 0.3, "PDFs processed. Starting fine-tuning...")

        finetune_process = subprocess.run(
            [
                sys.executable, "finetune_llama3.py",
                "--dataset_path", "processed_data/training_data",
                "--hub_model_id", f"Borislav18/{output_name}",
                "--epochs", "1",  # Starting with 1 epoch for quicker feedback
                "--gradient_accumulation_steps", "4",
            ],
            env={**os.environ, "HF_TOKEN": hf_token},
            capture_output=True,
            text=True,
        )
        if finetune_process.returncode != 0:
            progress_callback(
                "failed",
                0.0,
                f"Fine-tuning failed: {_stderr_tail(finetune_process.stderr)}",
            )
            return False

        progress_callback(
            "success",
            1.0,
            f"Training complete! Model pushed to Hugging Face as Borislav18/{output_name}",
        )
        return True
    except Exception as e:
        # Boundary of the background worker: report instead of raising so the
        # UI always ends up with a final status.
        progress_callback("failed", 0.0, f"Training process failed with error: {str(e)}")
        return False
def training_thread(pdf_dir, output_name):
    """Thread target: run the training pipeline and record its progress.

    Every progress report is forwarded to the module-level ``training_state``.
    """
    def report(status, progress, message):
        training_state.update(status, progress, message)

    # Publish an initial status before the pipeline reports anything itself.
    report("running", 0.01, "Starting training process...")

    # Hand over to the actual pipeline; it reports through the same callback.
    run_training_process(pdf_dir, output_name, report)
# Serialises the "is a run active?" check with the switch to "running" so two
# near-simultaneous button clicks cannot both start a training thread.
_TRAINING_START_LOCK = threading.Lock()


def start_training(pdf_dir, output_name):
    """Start the training process in a background thread.

    Args:
        pdf_dir: Directory containing the PDFs; surrounding whitespace is
            ignored.
        output_name: Name for the fine-tuned model; surrounding whitespace is
            ignored.

    Returns:
        A ``(message, progress, status)`` tuple for the UI.
    """
    pdf_dir = (pdf_dir or "").strip()
    output_name = (output_name or "").strip()
    if not pdf_dir or not output_name:
        return "Please provide both a PDF directory and output model name", 0.0, "idle"

    with _TRAINING_START_LOCK:
        # Check if already running
        if training_state.status == "running":
            return (
                f"Training already in progress: {training_state.message}",
                training_state.progress,
                training_state.status,
            )
        # Mark the run as active before the thread exists, so a second
        # request arriving right now is rejected by the check above.
        training_state.update("running", 0.0, "Training started...")

    # Daemon thread: it must not keep the process alive on shutdown.
    thread = threading.Thread(
        target=training_thread,
        args=(pdf_dir, output_name),
        daemon=True,
    )
    thread.start()
    return "Training started...", 0.0, "running"
def get_training_status():
    """Return ``(message, progress, status)`` from the shared training state."""
    state = training_state
    return state.message, state.progress, state.status
+# Create the main application
with gr.Blocks(title="Shedify - Document Assistant") as demo:
    with gr.Row():
        with gr.Column(scale=2):
            gr.Markdown(f"# {title}")
            gr.Markdown(description)
        with gr.Column(scale=1):
            # Training controls
            with gr.Group(visible=True):
                gr.Markdown("## Train New Model")
                pdf_dir = gr.Textbox(label="PDF Directory", placeholder="Path to directory containing PDFs")
                output_name = gr.Textbox(label="Model Name", placeholder="Name for your fine-tuned model", value="Shedify-v1")
                train_btn = gr.Button("Start Training")
                training_message = gr.Textbox(label="Training Status", interactive=False)
                training_progress = gr.Slider(
                    minimum=0, maximum=1, value=0,
                    label="Progress", interactive=False
                )
                # Hidden carrier for the raw status string; its change event
                # drives the button state below.
                training_status = gr.Textbox(visible=False)

    # Chat interface
    chatbot = gr.ChatInterface(
        fn=respond,
        additional_inputs=[
            gr.Textbox(
                value="You are an AI assistant trained on specific documents. Answer questions based only on information from these documents. If you don't know the answer from the documents, say so clearly.",
                label="System message"
            ),
            gr.Slider(minimum=1, maximum=2048, value=1024, step=1, label="Max new tokens"),
            gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature"),
            gr.Slider(
                minimum=0.1,
                maximum=1.0,
                value=0.9,
                step=0.05,
                label="Top-p (nucleus sampling)",
            ),
        ],
        examples=[
            ["Summarize the key points from all documents you were trained on."],
            ["What are the main themes discussed in the documents?"],
            ["Extract the most important concepts mentioned in the documents."],
            ["Explain the relationship between the different topics in the documents."],
            ["What recommendations or conclusions can be drawn from the documents?"],
        ]
    )

    status_outputs = [training_message, training_progress, training_status]

    # Set up event handlers
    train_btn.click(
        fn=start_training,
        inputs=[pdf_dir, output_name],
        outputs=status_outputs,
    )

    # Show the persisted status as soon as the page loads
    demo.load(get_training_status, outputs=status_outputs)

    def update_ui(status):
        """Disable the training button while a run is in progress."""
        # The status message is left untouched: a Textbox displays its value
        # as plain text, so wrapping it in HTML would show raw markup.
        return gr.update(interactive=status != "running")

    training_status.change(
        fn=update_ui,
        inputs=[training_status],
        outputs=[train_btn],
    )

    # Poll the training state every few seconds so progress made by the
    # background thread reaches the UI.
    status_timer = gr.Timer(5.0)
    status_timer.tick(fn=get_training_status, outputs=status_outputs)
 if __name__ == "__main__":
     demo.launch()

requirements.txt CHANGED Viewed

	@@ -1 +1,11 @@
1	- huggingface_hub==0.25.2

+huggingface_hub>=0.25.2
+gradio>=5.0.1
+transformers>=4.36.0
+peft>=0.7.0
+datasets>=2.14.0
+accelerate>=0.25.0
+trl>=0.7.1
+bitsandbytes>=0.40.0
+torch>=2.0.0
+PyPDF2>=3.0.0
+tqdm>=4.65.0