Update app.py
Browse files
app.py
CHANGED
|
@@ -33,8 +33,6 @@ def load_model():
|
|
| 33 |
"device_map": "auto",
|
| 34 |
"trust_remote_code": True,
|
| 35 |
"low_cpu_mem_usage": True,
|
| 36 |
-
"offload_folder": "offload",
|
| 37 |
-
"offload_state_dict": True,
|
| 38 |
}
|
| 39 |
|
| 40 |
# Use 8-bit quantization if enabled (saves memory)
|
|
@@ -55,7 +53,6 @@ def load_model():
|
|
| 55 |
model = PeftModel.from_pretrained(
|
| 56 |
base_model,
|
| 57 |
MODEL_REPO,
|
| 58 |
-
offload_folder="offload", # Enable disk offloading for adapter too
|
| 59 |
)
|
| 60 |
except TypeError as e:
|
| 61 |
if "unexpected keyword argument" in str(e):
|
|
@@ -97,7 +94,6 @@ def load_model():
|
|
| 97 |
model = PeftModel.from_pretrained(
|
| 98 |
base_model,
|
| 99 |
temp_dir,
|
| 100 |
-
offload_folder="offload"
|
| 101 |
)
|
| 102 |
|
| 103 |
# Cleanup
|
|
|
|
| 33 |
"device_map": "auto",
|
| 34 |
"trust_remote_code": True,
|
| 35 |
"low_cpu_mem_usage": True,
|
|
|
|
|
|
|
| 36 |
}
|
| 37 |
|
| 38 |
# Use 8-bit quantization if enabled (saves memory)
|
|
|
|
| 53 |
model = PeftModel.from_pretrained(
|
| 54 |
base_model,
|
| 55 |
MODEL_REPO,
|
|
|
|
| 56 |
)
|
| 57 |
except TypeError as e:
|
| 58 |
if "unexpected keyword argument" in str(e):
|
|
|
|
| 94 |
model = PeftModel.from_pretrained(
|
| 95 |
base_model,
|
| 96 |
temp_dir,
|
|
|
|
| 97 |
)
|
| 98 |
|
| 99 |
# Cleanup
|