Georg4000 committed on
Commit
b580227
·
verified ·
1 Parent(s): 22e000b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -1
app.py CHANGED
@@ -20,7 +20,11 @@ model_name = "Qwen/Qwen1.5-4B-Chat" # يمكنك استخدام "google/gemma-2
20
  device = "cuda" if torch.cuda.is_available() else "cpu"
21
 
22
  # تحميل النموذج والمحول مع تقليل الاستهلاك
23
- model = AutoModelForCausalLM.from_pretrained(model_name, device_map="auto", load_in_8bit=True)
 
 
 
 
24
  tokenizer = AutoTokenizer.from_pretrained(model_name)
25
 
26
  # ردود مخصصة
 
20
  device = "cuda" if torch.cuda.is_available() else "cpu"
21
 
22
  # تحميل النموذج والمحول مع تقليل الاستهلاك
23
+ model = AutoModelForCausalLM.from_pretrained(
24
+ model_name,
25
+ torch_dtype=torch.float16,
26
+ device_map="auto"
27
+ )
28
  tokenizer = AutoTokenizer.from_pretrained(model_name)
29
 
30
  # ردود مخصصة