Ctaake committed on
Commit
88db26a
·
verified ·
1 Parent(s): 2a8b052

Switch nous research

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -10,12 +10,13 @@ from datetime import datetime
10
  checkpoint = "CohereForAI/c4ai-command-r-v01"
11
  checkpoint = "mistralai/Mistral-7B-Instruct-v0.1"
12
  checkpoint = "google/gemma-1.1-7b-it"
 
13
  path_to_log = "FlaggedFalse.txt"
14
 
15
  # Inference client with the model (And HF-token if needed)
16
  client = InferenceClient(checkpoint)
17
  tokenizer = AutoTokenizer.from_pretrained(checkpoint)
18
- if checkpoint == "mistralai/Mistral-7B-Instruct-v0.1":
19
  # Tokenizer chat template correction(Only works for mistral models)
20
  chat_template = open("mistral-instruct.jinja").read()
21
  chat_template = chat_template.replace(' ', '').replace('\n', '')
@@ -58,7 +59,7 @@ def inference(message, history, systemPrompt=SYSTEM_PROMPT+SYSTEM_PROMPT_PLUS, t
58
  seed=random.randint(0, 999999999),
59
  )
60
  # Generating the response by passing the prompt in right format plus the client settings
61
- stream = client.text_generation(format_prompt_gemma(message, history, systemPrompt),
62
  **client_settings)
63
  # Reading the stream
64
  partial_response = ""
 
10
  checkpoint = "CohereForAI/c4ai-command-r-v01"
11
  checkpoint = "mistralai/Mistral-7B-Instruct-v0.1"
12
  checkpoint = "google/gemma-1.1-7b-it"
13
+ checkpoint = "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO"
14
  path_to_log = "FlaggedFalse.txt"
15
 
16
  # Inference client with the model (And HF-token if needed)
17
  client = InferenceClient(checkpoint)
18
  tokenizer = AutoTokenizer.from_pretrained(checkpoint)
19
+ if checkpoint == "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO":
20
  # Tokenizer chat template correction(Only works for mistral models)
21
  chat_template = open("mistral-instruct.jinja").read()
22
  chat_template = chat_template.replace(' ', '').replace('\n', '')
 
59
  seed=random.randint(0, 999999999),
60
  )
61
  # Generating the response by passing the prompt in right format plus the client settings
62
+ stream = client.text_generation(format_prompt(message, history, systemPrompt),
63
  **client_settings)
64
  # Reading the stream
65
  partial_response = ""