Spaces:
Sleeping
Sleeping
bits
Browse files
- Dockerfile +2 -0
- app/model_loader.py +2 -1
- requirements.txt +1 -0
Dockerfile
CHANGED
|
@@ -5,6 +5,8 @@ WORKDIR /code
|
|
| 5 |
COPY ./requirements.txt /code/requirements.txt
|
| 6 |
|
| 7 |
RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt
|
|
|
|
|
|
|
| 8 |
|
| 9 |
RUN useradd -m -u 1000 user
|
| 10 |
|
|
|
|
| 5 |
COPY ./requirements.txt /code/requirements.txt
|
| 6 |
|
| 7 |
RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt
|
| 8 |
+
RUN apt-get update && apt-get install -y libbitsandbytes-dev
|
| 9 |
+
|
| 10 |
|
| 11 |
RUN useradd -m -u 1000 user
|
| 12 |
|
app/model_loader.py
CHANGED
|
@@ -20,7 +20,8 @@ def load_model():
|
|
| 20 |
use_auth_token=hf_token,
|
| 21 |
cache_dir="/tmp/hf_cache",
|
| 22 |
torch_dtype="auto",
|
| 23 |
-
device_map="auto"
|
|
|
|
| 24 |
)
|
| 25 |
model = PeftModel.from_pretrained(
|
| 26 |
base_model,
|
|
|
|
| 20 |
use_auth_token=hf_token,
|
| 21 |
cache_dir="/tmp/hf_cache",
|
| 22 |
torch_dtype="auto",
|
| 23 |
+
device_map="auto",
|
| 24 |
+
load_in_8bit=True # <-- Try enabling 8-bit
|
| 25 |
)
|
| 26 |
model = PeftModel.from_pretrained(
|
| 27 |
base_model,
|
requirements.txt
CHANGED
|
@@ -5,3 +5,4 @@ torch
|
|
| 5 |
accelerate
|
| 6 |
fastapi
|
| 7 |
uvicorn
|
|
|
|
|
|
| 5 |
accelerate
|
| 6 |
fastapi
|
| 7 |
uvicorn
|
| 8 |
+
bitsandbytes
|