Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -11,13 +11,13 @@ class RAGChatbot:
|
|
| 11 |
embedding_model="all-MiniLM-L6-v2"):
|
| 12 |
# Initialize tokenizer and model
|
| 13 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 14 |
-
self.bnb_config = BitsAndBytesConfig(
|
| 15 |
-
|
| 16 |
-
|
| 17 |
-
|
| 18 |
self.model = AutoModelForCausalLM.from_pretrained(
|
| 19 |
model_name,
|
| 20 |
-
|
| 21 |
device_map="auto"
|
| 22 |
)
|
| 23 |
|
|
|
|
| 11 |
embedding_model="all-MiniLM-L6-v2"):
|
| 12 |
# Initialize tokenizer and model
|
| 13 |
self.tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 14 |
+
# self.bnb_config = BitsAndBytesConfig(
|
| 15 |
+
# load_in_8bit=True, # Enable 8-bit loading
|
| 16 |
+
# llm_int8_threshold=6.0, # Threshold for mixed-precision computation
|
| 17 |
+
# )
|
| 18 |
self.model = AutoModelForCausalLM.from_pretrained(
|
| 19 |
model_name,
|
| 20 |
+
torch_dtype=torch.bfloat16,
|
| 21 |
device_map="auto"
|
| 22 |
)
|
| 23 |
|