Spaces:
Sleeping
Sleeping
Commit
·
3948567
1
Parent(s):
712d810
Initial commit
Browse files
app.py
CHANGED
|
@@ -20,15 +20,15 @@ if not hf_token:
|
|
| 20 |
login(token=hf_token)
|
| 21 |
logger.debug("Hugging Face login successful")
|
| 22 |
|
| 23 |
-
# لود مدل
|
| 24 |
-
logger.debug("Loading
|
| 25 |
try:
|
| 26 |
-
tokenizer = AutoTokenizer.from_pretrained("
|
| 27 |
-
model = AutoModelForCausalLM.from_pretrained("
|
| 28 |
code_gen = pipeline("text-generation", model=model, tokenizer=tokenizer, max_new_tokens=512, temperature=0.6, top_p=0.95)
|
| 29 |
-
logger.debug("
|
| 30 |
except Exception as e:
|
| 31 |
-
logger.error(f"Failed to load
|
| 32 |
raise
|
| 33 |
|
| 34 |
# آزادسازی حافظه
|
|
|
|
| 20 |
login(token=hf_token)
|
| 21 |
logger.debug("Hugging Face login successful")
|
| 22 |
|
| 23 |
+
# لود مدل Gemma 3 4B
|
| 24 |
+
logger.debug("Loading google/gemma-3-4b-it model")
|
| 25 |
try:
|
| 26 |
+
tokenizer = AutoTokenizer.from_pretrained("google/gemma-3-4b-it", cache_dir="/tmp/hf_cache")
|
| 27 |
+
model = AutoModelForCausalLM.from_pretrained("google/gemma-3-4b-it", cache_dir="/tmp/hf_cache", torch_dtype=torch.bfloat16, device_map="auto")
|
| 28 |
code_gen = pipeline("text-generation", model=model, tokenizer=tokenizer, max_new_tokens=512, temperature=0.6, top_p=0.95)
|
| 29 |
+
logger.debug("google/gemma-3-4b-it model loaded")
|
| 30 |
except Exception as e:
|
| 31 |
+
logger.error(f"Failed to load Gemma 3 model: {e}")
|
| 32 |
raise
|
| 33 |
|
| 34 |
# آزادسازی حافظه
|