NoeMartinezSanchez committed on
Commit
e80ce4c
·
1 Parent(s): 26ec9f1

eliminación del timeout

Browse files
Files changed (1) hide show
  1. models/gemma_wrapper.py +10 -7
models/gemma_wrapper.py CHANGED
@@ -92,27 +92,27 @@ class GemmaWrapper:
92
  loaded = False
93
  last_error = None
94
 
95
- for model_variant in MODEL_VARIANTS:
96
- if model_variant != MODEL_VARIANTS[0] and not loaded:
97
  logger.info(f"Trying fallback model: {model_variant}")
98
 
99
  try:
100
  logger.info(f"Loading tokenizer from {model_variant}...")
 
101
  self.tokenizer = AutoTokenizer.from_pretrained(
102
  model_variant,
103
  cache_dir=self.cache_dir,
104
  token=hf_token,
105
- timeout=300,
106
  trust_remote_code=True,
107
- force_download=True,
108
  )
 
109
 
110
  if self.tokenizer.pad_token is None:
111
  self.tokenizer.pad_token = self.tokenizer.eos_token
112
  logger.info("Set pad_token = eos_token")
113
 
114
  logger.info(f"Loading model from {model_variant}...")
115
- logger.info("Model size: ~4-5 GB. Using 300s timeout for download.")
116
  model_start = time.time()
117
 
118
  self.model = AutoModelForCausalLM.from_pretrained(
@@ -121,9 +121,7 @@ class GemmaWrapper:
121
  torch_dtype=torch.float32,
122
  cache_dir=self.cache_dir,
123
  token=hf_token,
124
- timeout=300,
125
  trust_remote_code=True,
126
- force_download=True,
127
  )
128
 
129
  model_time = time.time() - model_start
@@ -137,6 +135,11 @@ class GemmaWrapper:
137
  logger.error(f"KeyError loading {model_variant}: {e}")
138
  last_error = e
139
  continue
 
 
 
 
 
140
  except Exception as e:
141
  logger.error(f"Error loading {model_variant}: {str(e)}")
142
  last_error = e
 
92
  loaded = False
93
  last_error = None
94
 
95
+ for i, model_variant in enumerate(MODEL_VARIANTS):
96
+ if i > 0:
97
  logger.info(f"Trying fallback model: {model_variant}")
98
 
99
  try:
100
  logger.info(f"Loading tokenizer from {model_variant}...")
101
+ download_start = time.time()
102
  self.tokenizer = AutoTokenizer.from_pretrained(
103
  model_variant,
104
  cache_dir=self.cache_dir,
105
  token=hf_token,
 
106
  trust_remote_code=True,
 
107
  )
108
+ logger.info(f"Tokenizer downloaded in {time.time() - download_start:.1f}s")
109
 
110
  if self.tokenizer.pad_token is None:
111
  self.tokenizer.pad_token = self.tokenizer.eos_token
112
  logger.info("Set pad_token = eos_token")
113
 
114
  logger.info(f"Loading model from {model_variant}...")
115
+ logger.info("Model size: ~4-5 GB, may take several minutes...")
116
  model_start = time.time()
117
 
118
  self.model = AutoModelForCausalLM.from_pretrained(
 
121
  torch_dtype=torch.float32,
122
  cache_dir=self.cache_dir,
123
  token=hf_token,
 
124
  trust_remote_code=True,
 
125
  )
126
 
127
  model_time = time.time() - model_start
 
135
  logger.error(f"KeyError loading {model_variant}: {e}")
136
  last_error = e
137
  continue
138
+ except TypeError as e:
139
+ if "timeout" in str(e):
140
+ logger.error(f"timeout parameter not supported in {model_variant}: {e}")
141
+ last_error = e
142
+ continue
143
  except Exception as e:
144
  logger.error(f"Error loading {model_variant}: {str(e)}")
145
  last_error = e