warleagle committed on
Commit
92ca8d9
·
verified ·
1 Parent(s): 34306e9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -9,7 +9,7 @@ MODEL_NAME = "warleagle/medical_chat_saiga"
9
  config = PeftConfig.from_pretrained(MODEL_NAME)
10
  model = AutoModelForCausalLM.from_pretrained(
11
  config.base_model_name_or_path,
12
- load_in_4bit=True,
13
  torch_dtype=torch.float16,
14
  device_map="auto"
15
  )
@@ -42,7 +42,7 @@ def predict(input_data, temp):
42
 
43
  conversation = Conversation()
44
  conversation.add_user_message(input_data)
45
- prompt = conversation.get_prompt(tokenizer)
46
 
47
  output = generate(model, tokenizer, prompt, generation_config)
48
  return output
 
9
  config = PeftConfig.from_pretrained(MODEL_NAME)
10
  model = AutoModelForCausalLM.from_pretrained(
11
  config.base_model_name_or_path,
12
+ load_in_8bit=True,
13
  torch_dtype=torch.float16,
14
  device_map="auto"
15
  )
 
42
 
43
  conversation = Conversation()
44
  conversation.add_user_message(input_data)
45
+ prompt = conversation.get_prompt()
46
 
47
  output = generate(model, tokenizer, prompt, generation_config)
48
  return output