amkyawdev commited on
Commit
41fcec0
·
verified ·
1 Parent(s): d884c01

Upload app.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. app.py +24 -7
app.py CHANGED
@@ -5,7 +5,7 @@ Model: amkyawdev/mm-llm-tiny
5
 
6
  import os
7
  import torch
8
- from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
9
  import gradio as gr
10
 
11
  # Model name
@@ -14,12 +14,29 @@ MODEL_NAME = "amkyawdev/mm-llm-tiny"
14
  # Load model and tokenizer
15
  print(f"Loading model: {MODEL_NAME}...")
16
 
17
- tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
18
- model = AutoModelForCausalLM.from_pretrained(
19
- MODEL_NAME,
20
- torch_dtype=torch.float16,
21
- device_map="auto"
22
- )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
 
24
  # Create pipeline
25
  pipe = pipeline(
 
5
 
6
  import os
7
  import torch
8
+ from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline, AutoConfig
9
  import gradio as gr
10
 
11
  # Model name
 
14
  # Load model and tokenizer
15
  print(f"Loading model: {MODEL_NAME}...")
16
 
17
+ try:
18
+ tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
19
+
20
+ # Try with device_map first
21
+ model = AutoModelForCausalLM.from_pretrained(
22
+ MODEL_NAME,
23
+ torch_dtype=torch.float16,
24
+ device_map="auto",
25
+ low_cpu_mem_usage=True
26
+ )
27
+
28
+ print("Model loaded on GPU!")
29
+
30
+ except Exception as e:
31
+ print(f"GPU failed: {e}, trying CPU...")
32
+ tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
33
+ model = AutoModelForCausalLM.from_pretrained(
34
+ MODEL_NAME,
35
+ torch_dtype=torch.float32,
36
+ low_cpu_mem_usage=True
37
+ )
38
+ model = model.to("cpu")
39
+ print("Model loaded on CPU!")
40
 
41
  # Create pipeline
42
  pipe = pipeline(