Spaces:

Sammaali
/

Post_Process_Elevenlabs

Sleeping

Sammaali committed 10 days ago

Commit

b61fa99

verified ·

1 Parent(s): c147ba9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -22,23 +22,27 @@ tokenizer = AutoTokenizer.from_pretrained(model_id)
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
-    torch_dtype=torch.float16,
-    device_map="auto"
 )
 # =========================
 # Clean Text Using Gemma
 # =========================
 def clean_text(text):
     prompt = f"""
-You are an assistant that cleans Arabic speech transcripts.
-Tasks:
-- remove filler words (اممم، آآآ، يعني)
-- remove repeated words
-- keep the same meaning
-- return only the cleaned text
 Transcript:
 {text}
@@ -47,17 +51,19 @@ Transcript:
     inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
     with torch.no_grad():
         outputs = model.generate(
             **inputs,
-            max_new_tokens=200,
-            temperature=0.2
         )
     result = tokenizer.decode(outputs[0], skip_special_tokens=True)
-    return result
-# =========================
 # ElevenLabs Speech To Text
 # =========================

 model = AutoModelForCausalLM.from_pretrained(
     model_id,
+    torch_dtype=torch.float32
 )
+device = "cuda" if torch.cuda.is_available() else "cpu"
+model.to(device)
 # =========================
 # Clean Text Using Gemma
 # =========================
 def clean_text(text):
+    text = text[:1500]
     prompt = f"""
+Clean this Arabic speech transcript.
+Remove filler words like:
+اممم، آآآ، يعني
+Remove repeated words.
+Keep the same meaning.
 Transcript:
 {text}
     inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
     with torch.no_grad():
         outputs = model.generate(
             **inputs,
+            max_new_tokens=120,
+            do_sample=True,
+            temperature=0.7,
+            top_p=0.9,
+            repetition_penalty=1.2
         )
     result = tokenizer.decode(outputs[0], skip_special_tokens=True)
+    return result# =========================
 # ElevenLabs Speech To Text
 # =========================