Spaces:

dar-tau
/

selfie

Sleeping

App Files Community

dar-tau committed on Apr 11, 2024

Commit

e048966

verified ·

1 Parent(s): 655bead

Update configs.py

Browse files

Files changed (1) hide show

configs.py +24 -18

configs.py CHANGED Viewed

@@ -27,22 +27,29 @@ model_info = {
                       original_prompt_template='<s>{prompt}',
                       interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
                       layers_format=llama_layers_format),
     'Mixtral 8x7B Instruct (Experimental)': dict(model_path='TheBloke/Mixtral-8x7B-Instruct-v0.1-AWQ',
                                   token=os.environ['hf_token'], wait_with_hidden_states=True,
                                   original_prompt_template='<s>{prompt}',
                                   interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
                                   layers_format=llama_layers_format
                                  ),
-    'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
-                                   token=os.environ['hf_token'],
-                                   wait_with_hidden_states=True, dont_cuda=True, device_map='cuda', # disable_exllama=True,
-                                   original_prompt_template='<s>{prompt}',
-                                   interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
-                                   layers_format=llama_layers_format
-                                  ),
-    'GPT-2 Small': dict(model_path='gpt2', original_prompt_template='{prompt}',
-                     interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
-                     layers_format=gpt_layers_format),
     # 'GPT-2 Medium': dict(model_path='gpt2-medium', original_prompt_template='{prompt}',
     #                  interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
     #                  layers_format=gpt_layers_format),
@@ -52,14 +59,13 @@ model_info = {
     # 'GPT-2 XL': dict(model_path='gpt2-xl', original_prompt_template='{prompt}',
     #                  interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
     #                  layers_format=gpt_layers_format),
-    'GPT-J 6B': dict(model_path='EleutherAI/gpt-j-6b', original_prompt_template='{prompt}',
-                     interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
-                     layers_format=gpt_layers_format),
-    'Mistral-7B Instruct': dict(model_path='mistralai/Mistral-7B-Instruct-v0.2', device_map='cpu',
-                                original_prompt_template='<s>{prompt}',
-                                interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
-                                layers_format=llama_layers_format),
     # 'Gemma-2B': dict(model_path='google/gemma-2b', device_map='cpu', token=os.environ['hf_token'],
     #                         original_prompt_template='<bos>{prompt}',
     #                         interpretation_prompt_template='<bos>User: [X]\n\nAnswer: {prompt}',

                       original_prompt_template='<s>{prompt}',
                       interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
                       layers_format=llama_layers_format),
+    'GPT-J 6B': dict(model_path='EleutherAI/gpt-j-6b', original_prompt_template='{prompt}',
+                     interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
+                     layers_format=gpt_layers_format),
+    'Mistral-7B Instruct': dict(model_path='mistralai/Mistral-7B-Instruct-v0.2', device_map='cpu',
+                                original_prompt_template='<s>{prompt}',
+                                interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
+                                layers_format=llama_layers_format),
+    'GPT-2 Small': dict(model_path='gpt2', original_prompt_template='{prompt}',
+                     interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
+                     layers_format=gpt_layers_format),
     'Mixtral 8x7B Instruct (Experimental)': dict(model_path='TheBloke/Mixtral-8x7B-Instruct-v0.1-AWQ',
                                   token=os.environ['hf_token'], wait_with_hidden_states=True,
                                   original_prompt_template='<s>{prompt}',
                                   interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
                                   layers_format=llama_layers_format
                                  ),
+    'Wizard Vicuna 30B Uncensored (Experimental)': dict(model_path='TheBloke/Wizard-Vicuna-30B-Uncensored-GPTQ',
+                                                        token=os.environ['hf_token'],
+                                                        wait_with_hidden_states=True, dont_cuda=True, device_map='cuda',
+                                                        original_prompt_template='<s>USER: {prompt}',
+                                                        interpretation_prompt_template='<s>USER: [X] ASSISTANT: {prompt}',
+                                                        layers_format=llama_layers_format
+                                                       ),
     # 'GPT-2 Medium': dict(model_path='gpt2-medium', original_prompt_template='{prompt}',
     #                  interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
     #                  layers_format=gpt_layers_format),
     # 'GPT-2 XL': dict(model_path='gpt2-xl', original_prompt_template='{prompt}',
     #                  interpretation_prompt_template='User: [X]\n\nAnswer: {prompt}',
     #                  layers_format=gpt_layers_format),
+    # 'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
+    #                                token=os.environ['hf_token'],
+    #                                wait_with_hidden_states=True, dont_cuda=True, device_map='cuda', # disable_exllama=True,
+    #                                original_prompt_template='<s>{prompt}',
+    #                                interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
+    #                                layers_format=llama_layers_format
+    #                               ),
     # 'Gemma-2B': dict(model_path='google/gemma-2b', device_map='cpu', token=os.environ['hf_token'],
     #                         original_prompt_template='<bos>{prompt}',
     #                         interpretation_prompt_template='<bos>User: [X]\n\nAnswer: {prompt}',