MGZON committed on
Commit
da159d9
·
verified ·
1 Parent(s): fca51d8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -6
app.py CHANGED
@@ -26,21 +26,23 @@ app = FastAPI(
26
  async def health_check():
27
  return {"status": "healthy"}
28
 
29
- # Load T5 model from Hub
30
  T5_REPO = "MGZON/mgzon-flan-t5-base"
31
  try:
32
- logger.info(f"Loading tokenizer for {T5_REPO} with HF_TOKEN")
33
  t5_tokenizer = AutoTokenizer.from_pretrained(
34
  T5_REPO,
35
  cache_dir=CACHE_DIR,
36
- use_auth_token=os.environ.get("HF_TOKEN")
 
37
  )
38
  logger.info(f"Successfully loaded tokenizer for {T5_REPO}")
39
- logger.info(f"Loading model for {T5_REPO}")
40
  t5_model = AutoModelForSeq2SeqLM.from_pretrained(
41
  T5_REPO,
42
  cache_dir=CACHE_DIR,
43
- use_auth_token=os.environ.get("HF_TOKEN")
 
44
  )
45
  logger.info(f"Successfully loaded model for {T5_REPO}")
46
  except Exception as e:
@@ -101,4 +103,4 @@ def ask(req: AskRequest):
101
  return {"model": model_name, "response": answer}
102
  except Exception as e:
103
  logger.error(f"Error processing request: {str(e)}")
104
- raise HTTPException(status_code=500, detail=f"خطأ أثناء معالجة الطلب: {str(e)}")
 
26
  async def health_check():
27
  return {"status": "healthy"}
28
 
29
+ # Load T5 model from local cache
30
  T5_REPO = "MGZON/mgzon-flan-t5-base"
31
  try:
32
+ logger.info(f"Loading tokenizer for {T5_REPO} from local cache")
33
  t5_tokenizer = AutoTokenizer.from_pretrained(
34
  T5_REPO,
35
  cache_dir=CACHE_DIR,
36
+ use_auth_token=os.environ.get("HF_TOKEN"),
37
+ local_files_only=True
38
  )
39
  logger.info(f"Successfully loaded tokenizer for {T5_REPO}")
40
+ logger.info(f"Loading model for {T5_REPO} from local cache")
41
  t5_model = AutoModelForSeq2SeqLM.from_pretrained(
42
  T5_REPO,
43
  cache_dir=CACHE_DIR,
44
+ use_auth_token=os.environ.get("HF_TOKEN"),
45
+ local_files_only=True
46
  )
47
  logger.info(f"Successfully loaded model for {T5_REPO}")
48
  except Exception as e:
 
103
  return {"model": model_name, "response": answer}
104
  except Exception as e:
105
  logger.error(f"Error processing request: {str(e)}")
106
+ raise HTTPException(status_code=500, detail=f"خطأ أثناء معالجة الطلب: {str(e)}")