Amish Kushwaha committed on
Commit
ae29859
·
1 Parent(s): 8ae2c46

Disable 4-bit quantization for the model

Browse files
Files changed (1) hide show
  1. app.py +6 -1
app.py CHANGED
@@ -3,7 +3,12 @@ from pydantic import BaseModel
3
  from transformers import pipeline
4
 
5
  # Load your Hugging Face model
6
- model = pipeline("text-generation", model="devops-bda/Abap")
 
 
 
 
 
7
 
8
  # Initialize FastAPI app
9
  app = FastAPI()
 
3
  from transformers import pipeline
4
 
5
  # Load your Hugging Face model
6
+ # model = pipeline("text-generation", model="devops-bda/Abap")
7
+ model = pipeline(
8
+ "text-generation",
9
+ model="devops-bda/Abap",
10
+ model_kwargs={"load_in_4bit": False} # Disable 4-bit quantization
11
+ )
12
 
13
  # Initialize FastAPI app
14
  app = FastAPI()