BoostedJonP committed on
Commit
c7aa5b3
·
1 Parent(s): 25ab7b8

removed bnb config

Browse files
Files changed (1) hide show
  1. app.py +1 -10
app.py CHANGED
@@ -1,6 +1,6 @@
1
  import gradio as gr
2
  import torch
3
- from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
4
  from functools import lru_cache
5
  import logging
6
 
@@ -11,14 +11,6 @@ logger = logging.getLogger(__name__)
11
  logging.basicConfig(level=logging.INFO)
12
  logger.info("Starting Jerome Powell AI Assistant...")
13
 
14
-
15
- QUANTIZATION_CONFIG = BitsAndBytesConfig(
16
- load_in_4bit=True,
17
- bnb_4bit_quant_type="nf4",
18
- bnb_4bit_use_double_quant=True,
19
- bnb_4bit_compute_dtype="float16",
20
- )
21
-
22
  MODEL_NAME = "BoostedJonP/powell-phi3-mini"
23
 
24
 
@@ -36,7 +28,6 @@ def load_model():
36
  model = AutoModelForCausalLM.from_pretrained(
37
  MODEL_NAME,
38
  trust_remote_code=True,
39
- quantization_config=QUANTIZATION_CONFIG,
40
  device_map="auto",
41
  attn_implementation="eager",
42
  use_cache=True,
 
1
  import gradio as gr
2
  import torch
3
+ from transformers import AutoTokenizer, AutoModelForCausalLM
4
  from functools import lru_cache
5
  import logging
6
 
 
11
  logging.basicConfig(level=logging.INFO)
12
  logger.info("Starting Jerome Powell AI Assistant...")
13
 
 
 
 
 
 
 
 
 
14
  MODEL_NAME = "BoostedJonP/powell-phi3-mini"
15
 
16
 
 
28
  model = AutoModelForCausalLM.from_pretrained(
29
  MODEL_NAME,
30
  trust_remote_code=True,
 
31
  device_map="auto",
32
  attn_implementation="eager",
33
  use_cache=True,