ahmedembedded committed on
Commit
a504372
·
verified ·
1 Parent(s): 90a91f4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -1,14 +1,14 @@
1
  import gradio as gr
2
  from peft import AutoPeftModelForCausalLM
3
- from transformers import AutoTokenizer
4
  import torch
5
 
6
  # Load the model and tokenizer
7
  model_name = "ahmedembedded/AskFAST"
8
- load_in_4bit = True
9
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
10
 
11
- model = AutoPeftModelForCausalLM.from_pretrained(model_name, load_in_4bit=load_in_4bit).to(device)
12
  tokenizer = AutoTokenizer.from_pretrained(model_name)
13
 
14
  # Define the prompt context
 
import gradio as gr
from peft import AutoPeftModelForCausalLM
from transformers import AutoTokenizer, BitsAndBytesConfig
import torch

# Load the model and tokenizer.
model_name = "ahmedembedded/AskFAST"

# 4-bit quantization (bitsandbytes) to fit the model in limited GPU memory.
quantization_config = BitsAndBytesConfig(load_in_4bit=True)

# Kept for downstream code (e.g. moving input tensors to the model's device).
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# NOTE: do NOT call `.to(device)` on a 4-bit quantized model — recent
# transformers raises ValueError ("`.to` is not supported for 4-bit or
# 8-bit bitsandbytes models"). The quantized weights are placed on the
# available device(s) at load time via `device_map="auto"`.
model = AutoPeftModelForCausalLM.from_pretrained(
    model_name,
    quantization_config=quantization_config,
    device_map="auto",
)
tokenizer = AutoTokenizer.from_pretrained(model_name)

# Define the prompt context