Update main.py
main.py
CHANGED
@@ -1,15 +1,55 @@
-        data = await request.json()
-    except:
-        data = await request.body()
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+MODEL_NAME = "Qwen/Qwen2.5-7B-Instruct"
+
+def main():
+    # Load tokenizer
+    tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
+
+    # Pick a suitable dtype: bfloat16 if a GPU is available, otherwise float32 on CPU
+    has_cuda = torch.cuda.is_available()
+    dtype = torch.bfloat16 if has_cuda else torch.float32
+
+    # Load model (device_map="auto" distributes it automatically)
+    model = AutoModelForCausalLM.from_pretrained(
+        MODEL_NAME,
+        torch_dtype=dtype,
+        device_map="auto"
+    )
+
+    # Prompt: explain Past Simple in simple English
+    messages = [
+        {"role": "system", "content": "You are a friendly English teacher. Explain clearly and simply."},
+        {"role": "user", "content": "Explain the Past Simple tense in very simple English. Give rules and 8 short examples. Keep it clear for A2 learners."}
+    ]
+
+    # Convert chat messages to model input
+    text = tokenizer.apply_chat_template(
+        messages,
+        tokenize=False,
+        add_generation_prompt=True
+    )
+
+    model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
+
+    # Generate
+    with torch.no_grad():
+        generated_ids = model.generate(
+            **model_inputs,
+            max_new_tokens=400,
+            do_sample=True,
+            temperature=0.7,
+            top_p=0.9
+        )
+
+    # Keep only the newly generated tokens (remove the prompt tokens)
+    new_tokens = generated_ids[0, model_inputs["input_ids"].shape[-1]:]
+    response = tokenizer.decode(new_tokens, skip_special_tokens=True)
+
+    print("\n=== Model Response ===\n")
+    print(response.strip())
+    print("\n======================\n")
+
+if __name__ == "__main__":
+    main()
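A quick way to sanity-check the prompt-formatting step without downloading the full 7B weights is to run only the tokenizer. This is a minimal sketch, assuming the same MODEL_NAME and message roles as in main.py above; it just prints the chat-formatted string that the script passes to the model:

from transformers import AutoTokenizer

# Load only the tokenizer (no model weights) and inspect the formatted prompt.
tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2.5-7B-Instruct")
messages = [
    {"role": "system", "content": "You are a friendly English teacher. Explain clearly and simply."},
    {"role": "user", "content": "Explain the Past Simple tense in very simple English."},
]
text = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
print(text)  # the chat-template markup the model sees before generation

Running the full script also requires the accelerate package to be installed, since device_map="auto" depends on it.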