aadya1762 committed on
Commit
3a14fb3
·
1 Parent(s): d71e3b1

add examples functionality

Browse files
gemmademo/__init__.py CHANGED
@@ -1,11 +1,9 @@
1
  from ._chat import GradioChat
2
  from ._model import LlamaCppGemmaModel
3
  from ._prompts import PromptManager
4
- from ._utils import huggingface_login
5
 
6
  __all__ = [
7
  "GradioChat",
8
  "LlamaCppGemmaModel",
9
  "PromptManager",
10
- "huggingface_login",
11
  ]
 
1
  from ._chat import GradioChat
2
  from ._model import LlamaCppGemmaModel
3
  from ._prompts import PromptManager
 
4
 
5
  __all__ = [
6
  "GradioChat",
7
  "LlamaCppGemmaModel",
8
  "PromptManager",
 
9
  ]
gemmademo/_chat.py CHANGED
@@ -67,23 +67,77 @@ class GradioChat:
67
  response_stream = self.model.generate_response(prompt)
68
  yield from response_stream
69
 
70
- chat_interface = gr.ChatInterface(
71
- chat_fn,
72
- textbox=gr.Textbox(placeholder="Ask me something...", container=False),
73
- additional_inputs=[
74
- gr.Dropdown(
75
- choices=self.model_options,
76
- value=self.current_model_name,
77
- label="Select Gemma Model",
78
- ),
79
- gr.Dropdown(
80
- choices=self.task_options,
81
- value=self.current_task_name,
82
- label="Select Task",
83
- ),
84
  ],
85
- )
86
- chat_interface.launch()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
87
 
88
  def run(self):
89
  self._chat()
 
67
  response_stream = self.model.generate_response(prompt)
68
  yield from response_stream
69
 
70
+ # Examples for each task type
71
+ examples = {
72
+ "Question Answering": [
73
+ "What is quantum computing?",
74
+ "How do neural networks work?",
75
+ "Explain climate change in simple terms.",
 
 
 
 
 
 
 
 
76
  ],
77
+ "Text Generation": [
78
+ "Once upon a time in a distant galaxy...",
79
+ "The abandoned house at the end of the street had...",
80
+ "In the year 2150, humanity discovered...",
81
+ ],
82
+ "Code Completion": [
83
+ "def fibonacci(n):",
84
+ "class BinarySearchInAList:",
85
+ "async def fetch_data(url):",
86
+ ],
87
+ }
88
+
89
+ def update_examples(task):
90
+ return examples.get(task)
91
+
92
+ with gr.Blocks() as demo:
93
+ with gr.Row():
94
+ with gr.Column(scale=3):
95
+ task_dropdown = gr.Dropdown(
96
+ choices=self.task_options,
97
+ value=self.current_task_name,
98
+ label="Select Task",
99
+ )
100
+ model_dropdown = gr.Dropdown(
101
+ choices=self.model_options,
102
+ value=self.current_model_name,
103
+ label="Select Gemma Model",
104
+ )
105
+
106
+ chat_interface = gr.ChatInterface(
107
+ chat_fn,
108
+ additional_inputs=[model_dropdown, task_dropdown],
109
+ textbox=gr.Textbox(
110
+ placeholder="Ask me something...", container=False
111
+ ),
112
+ )
113
+
114
+ with gr.Column(scale=1):
115
+ gr.Markdown(
116
+ """
117
+ ## Tips
118
+
119
+ - First response will be slower (model loading)
120
+ - Switching models clears chat history
121
+ - For code completion, start with function definition
122
+ - Shorter queries work better
123
+ - Larger models (7B) need more memory but give better results
124
+ """
125
+ )
126
+
127
+ gr.Markdown("## Examples")
128
+ examples_list = gr.Examples(
129
+ examples=examples[self.current_task_name],
130
+ inputs=chat_interface.textbox,
131
+ )
132
+
133
+ # Update examples when task changes
134
+ task_dropdown.change(
135
+ fn=update_examples,
136
+ inputs=task_dropdown,
137
+ outputs=examples_list,
138
+ )
139
+
140
+ demo.launch()
141
 
142
  def run(self):
143
  self._chat()
gemmademo/_model.py CHANGED
@@ -25,22 +25,22 @@ class LlamaCppGemmaModel:
25
  AVAILABLE_MODELS: Dict[str, Dict] = {
26
  "gemma-3b": {
27
  "model_path": "models/gemma-3-1b-it-Q5_K_M.gguf",
28
- "repo_id": "bartowski/google_gemma-3-1b-it-GGUF",
29
  "filename": "google_gemma-3-1b-it-Q5_K_M.gguf", # Better quantization
30
  "description": "3B parameters, instruction-tuned (Q5_K_M)",
31
  "type": "instruct",
32
  },
33
  "gemma-2b": {
34
  "model_path": "models/gemma-2b-it.gguf",
35
- "repo_id": "MaziyarPanahi/gemma-2b-it-GGUF",
36
  "filename": "gemma-2b-it.Q4_K_M.gguf",
37
  "description": "2B parameters, instruction-tuned",
38
  "type": "instruct",
39
  },
40
  "gemma-7b": {
41
  "model_path": "models/gemma-7b-it.gguf",
42
- "repo_id": "rahuldshetty/gemma-7b-it-gguf-quantized",
43
- "filename": "gemma-7b-it-Q4_K_M.gguf",
44
  "description": "7B parameters in GGUF format",
45
  "type": "base",
46
  },
 
25
  AVAILABLE_MODELS: Dict[str, Dict] = {
26
  "gemma-3b": {
27
  "model_path": "models/gemma-3-1b-it-Q5_K_M.gguf",
28
+ "repo_id": "bartowski/google_gemma-3-1b-it-GGUF",
29
  "filename": "google_gemma-3-1b-it-Q5_K_M.gguf", # Better quantization
30
  "description": "3B parameters, instruction-tuned (Q5_K_M)",
31
  "type": "instruct",
32
  },
33
  "gemma-2b": {
34
  "model_path": "models/gemma-2b-it.gguf",
35
+ "repo_id": "MaziyarPanahi/gemma-2b-it-GGUF",
36
  "filename": "gemma-2b-it.Q4_K_M.gguf",
37
  "description": "2B parameters, instruction-tuned",
38
  "type": "instruct",
39
  },
40
  "gemma-7b": {
41
  "model_path": "models/gemma-7b-it.gguf",
42
+ "repo_id": "rahuldshetty/gemma-7b-it-gguf-quantized",
43
+ "filename": "gemma-7b-it-Q4_K_M.gguf",
44
  "description": "7B parameters in GGUF format",
45
  "type": "base",
46
  },
gemmademo/_utils.py DELETED
@@ -1,7 +0,0 @@
1
- def huggingface_login(token: str):
2
- """
3
- Login to Hugging Face using the token
4
- """
5
- from huggingface_hub import login
6
-
7
- login(token=token)