AndaiMD committed on
Commit
7b23d6d
·
1 Parent(s): 71681f4
Files changed (3) hide show
  1. Dockerfile +2 -0
  2. app/model_loader.py +2 -1
  3. requirements.txt +1 -0
Dockerfile CHANGED
@@ -5,6 +5,8 @@ WORKDIR /code
5
  COPY ./requirements.txt /code/requirements.txt
6
 
7
  RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt
 
 
8
 
9
  RUN useradd -m -u 1000 user
10
 
 
5
  COPY ./requirements.txt /code/requirements.txt
6
 
7
  RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt
8
+ RUN apt-get update && apt-get install -y libbitsandbytes-dev
9
+
10
 
11
  RUN useradd -m -u 1000 user
12
 
app/model_loader.py CHANGED
@@ -20,7 +20,8 @@ def load_model():
20
  use_auth_token=hf_token,
21
  cache_dir="/tmp/hf_cache",
22
  torch_dtype="auto",
23
- device_map="auto"
 
24
  )
25
  model = PeftModel.from_pretrained(
26
  base_model,
 
20
  use_auth_token=hf_token,
21
  cache_dir="/tmp/hf_cache",
22
  torch_dtype="auto",
23
+ device_map="auto",
24
+ load_in_8bit=True # <-- Try enabling 8-bit
25
  )
26
  model = PeftModel.from_pretrained(
27
  base_model,
requirements.txt CHANGED
@@ -5,3 +5,4 @@ torch
5
  accelerate
6
  fastapi
7
  uvicorn
 
 
5
  accelerate
6
  fastapi
7
  uvicorn
8
+ bitsandbytes