alsojulha committed on
Commit
7025d17
·
verified ·
1 Parent(s): 3239f01

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -1
app.py CHANGED
@@ -10,7 +10,12 @@ from langchain_community.document_loaders import PyMuPDFLoader
10
  # Configurações do modelo
11
  MODEL_PATH = "numind/NuExtract-1.5-tiny"
12
  tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
13
- model = AutoModelForCausalLM.from_pretrained(MODEL_PATH, torch_dtype=torch.float32)
 
 
 
 
 
14
 
15
  # Constantes
16
  MAX_INPUT_SIZE = 4000
 
10
  # Configurações do modelo
11
  MODEL_PATH = "numind/NuExtract-1.5-tiny"
12
  tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
13
+ device = "cuda"
14
+ model = AutoModelForCausalLM.from_pretrained(
15
+ MODEL_PATH,
16
+ torch_dtype=torch.float16 # Usa FP16 para reduzir o uso de VRAM
17
+ ).to(device)
18
+ torch.cuda.empty_cache()
19
 
20
  # Constantes
21
  MAX_INPUT_SIZE = 4000