Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -10,7 +10,6 @@ from transformers import (
|
|
| 10 |
AutoTokenizer,
|
| 11 |
AutoModelForTokenClassification,
|
| 12 |
AutoModelForCausalLM,
|
| 13 |
-
BitsAndBytesConfig,
|
| 14 |
)
|
| 15 |
from peft import PeftModel
|
| 16 |
|
|
@@ -37,13 +36,6 @@ ID2LABEL = {0: "O", 1: "B-TIMEX", 2: "I-TIMEX"}
|
|
| 37 |
BASE_ID = "google/gemma-2b-it"
|
| 38 |
ADAPTER_ID = "Rhulli/gemma-2b-it-TIMEX3"
|
| 39 |
|
| 40 |
-
# --- Configuración de cuantización para el modelo de normalización ---
|
| 41 |
-
quant_config = BitsAndBytesConfig(
|
| 42 |
-
load_in_4bit=True,
|
| 43 |
-
bnb_4bit_quant_type="nf4",
|
| 44 |
-
bnb_4bit_compute_dtype=torch.float16,
|
| 45 |
-
)
|
| 46 |
-
|
| 47 |
# --- Leer el token del entorno (añadido como Repository Secret) ---
|
| 48 |
HF_TOKEN = os.getenv("HF_TOKEN")
|
| 49 |
|
|
@@ -55,13 +47,14 @@ def load_models():
|
|
| 55 |
if torch.cuda.is_available():
|
| 56 |
ner_mod.to("cuda")
|
| 57 |
|
| 58 |
-
# Carga del modelo de normalización (
|
| 59 |
base_mod = AutoModelForCausalLM.from_pretrained(
|
| 60 |
BASE_ID,
|
| 61 |
-
quantization_config=quant_config,
|
| 62 |
device_map="auto",
|
| 63 |
token=HF_TOKEN
|
| 64 |
)
|
|
|
|
|
|
|
| 65 |
norm_tok = AutoTokenizer.from_pretrained(ADAPTER_ID, use_fast=True, token=HF_TOKEN)
|
| 66 |
norm_mod = PeftModel.from_pretrained(
|
| 67 |
base_mod,
|
|
|
|
| 10 |
AutoTokenizer,
|
| 11 |
AutoModelForTokenClassification,
|
| 12 |
AutoModelForCausalLM,
|
|
|
|
| 13 |
)
|
| 14 |
from peft import PeftModel
|
| 15 |
|
|
|
|
| 36 |
BASE_ID = "google/gemma-2b-it"
|
| 37 |
ADAPTER_ID = "Rhulli/gemma-2b-it-TIMEX3"
|
| 38 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
# --- Leer el token del entorno (añadido como Repository Secret) ---
|
| 40 |
HF_TOKEN = os.getenv("HF_TOKEN")
|
| 41 |
|
|
|
|
| 47 |
if torch.cuda.is_available():
|
| 48 |
ner_mod.to("cuda")
|
| 49 |
|
| 50 |
+
# Carga del modelo base de normalización (sin cuantización)
|
| 51 |
base_mod = AutoModelForCausalLM.from_pretrained(
|
| 52 |
BASE_ID,
|
|
|
|
| 53 |
device_map="auto",
|
| 54 |
token=HF_TOKEN
|
| 55 |
)
|
| 56 |
+
|
| 57 |
+
# Carga del tokenizer y adaptador LoRA
|
| 58 |
norm_tok = AutoTokenizer.from_pretrained(ADAPTER_ID, use_fast=True, token=HF_TOKEN)
|
| 59 |
norm_mod = PeftModel.from_pretrained(
|
| 60 |
base_mod,
|