Spaces:

TheMaisk
/

TheMaisk_tinychat1b

Sleeping

App Files Files Community

TheMaisk committed on Jan 9, 2024

Commit

eefd049

1 Parent(s): fca2eb7

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -7

app.py CHANGED Viewed

@@ -11,17 +11,17 @@ def generate(
     temperature=0.4,
     top_p=0.95,
     top_k=50,
-    max_new_tokens=2000,
 ):
     pipe = load_model(model_name)
-    # Need to add additional options later.
     if template_name == "Falcon 1B Template":
         message_template = [
             {"role": "user", "content": "Hello!"},
             {"role": "assistant", "content": "Hello! How can I assist you today?"},
             {"role": "user", "content": user_input},
         ]
-    else:  # Default to "TinyLlama Template"
         message_template = [
             {
                 "role": "system",
@@ -30,7 +30,6 @@ def generate(
             {"role": "user", "content": user_input},
         ]
-    # Set tokenize correctly. Otherwise ticking the box breaks it.
     prompt = pipe.tokenizer.apply_chat_template(message_template, tokenize=False, add_generation_prompt=True)
     outputs = pipe(prompt, max_new_tokens=max_new_tokens, do_sample=True,
                    temperature=temperature, top_k=top_k, top_p=top_p, repetition_penalty=1.10)
@@ -38,7 +37,7 @@ def generate(
 model_choices = ["TinyLlama/TinyLlama-1.1B-Chat-v1.0", "ericzzz/falcon-rw-1b-chat"]
 template_choices = ["TinyLlama Template", "Falcon Template"]
-# What are the best options?
 g = gr.Interface(
     fn=generate,
     inputs=[
@@ -48,12 +47,13 @@ g = gr.Interface(
         gr.components.Slider(minimum=0, maximum=1, value=0.4, label="Temperature"),
         gr.components.Slider(minimum=0, maximum=1, value=0.95, label="Top p"),
         gr.components.Slider(minimum=0, maximum=100, step=1, value=50, label="Top k"),
-        gr.components.Slider(minimum=1, maximum=1024, step=1, value=2000, label="Max tokens"),
     ],
     outputs=[gr.Textbox(lines=10, label="Output")],
     title="Hugging Face Transformers Model",
     description="A simple interface for generating text with a Hugging Face Transformers model.",
     concurrency_limit=1
 )
-g.launch(max_threads=2)

     temperature=0.4,
     top_p=0.95,
     top_k=50,
+    max_new_tokens=256,
 ):
     pipe = load_model(model_name)
+    # Hier weitere Optionen hinzufügen
     if template_name == "Falcon 1B Template":
         message_template = [
             {"role": "user", "content": "Hello!"},
             {"role": "assistant", "content": "Hello! How can I assist you today?"},
             {"role": "user", "content": user_input},
         ]
+    else:  # Standardmäßig "TinyLlama Template"
         message_template = [
             {
                 "role": "system",
             {"role": "user", "content": user_input},
         ]
     prompt = pipe.tokenizer.apply_chat_template(message_template, tokenize=False, add_generation_prompt=True)
     outputs = pipe(prompt, max_new_tokens=max_new_tokens, do_sample=True,
                    temperature=temperature, top_k=top_k, top_p=top_p, repetition_penalty=1.10)
 model_choices = ["TinyLlama/TinyLlama-1.1B-Chat-v1.0", "ericzzz/falcon-rw-1b-chat"]
 template_choices = ["TinyLlama Template", "Falcon Template"]
 g = gr.Interface(
     fn=generate,
     inputs=[
         gr.components.Slider(minimum=0, maximum=1, value=0.4, label="Temperature"),
         gr.components.Slider(minimum=0, maximum=1, value=0.95, label="Top p"),
         gr.components.Slider(minimum=0, maximum=100, step=1, value=50, label="Top k"),
+        gr.components.Slider(minimum=1, maximum=1024, step=1, value=256, label="Max tokens"),
     ],
     outputs=[gr.Textbox(lines=10, label="Output")],
     title="Hugging Face Transformers Model",
     description="A simple interface for generating text with a Hugging Face Transformers model.",
+    theme='syddharth/gray-minimal',  # Hinzugefügtes Theme
     concurrency_limit=1
 )
+g.launch(max_threads=2)