legolasyiu committed on
Commit
d4f45f5
·
verified ·
1 Parent(s): dcfe34b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -11
app.py CHANGED
@@ -21,17 +21,20 @@ def convert_audio_to_text(audio_file):
21
 
22
  prompt = "Transcribe the audio."
23
 
24
- inputs = processor(
25
- text=prompt,
26
- audio=waveform.squeeze(),
27
- sampling_rate=sample_rate,
28
- return_tensors="pt"
29
- ).to(model.device)
30
-
31
- with torch.no_grad():
32
- output = model.generate(**inputs, max_new_tokens=512)
33
-
34
- result = processor.decode(output[0], skip_special_tokens=True)
 
 
 
35
  return result
36
 
37
 
 
21
 
22
  prompt = "Transcribe the audio."
23
 
24
+ inputs = processor.apply_chat_template(
25
+ messages,
26
+ add_generation_prompt=True,
27
+ tokenize=True, return_dict=True,
28
+ return_tensors="pt",
29
+ )
30
+
31
+ outputs = model.generate(**input_ids, max_new_tokens=512)
32
+
33
+ result = processor.batch_decode(
34
+ outputs,
35
+ skip_special_tokens=False,
36
+ clean_up_tokenization_spaces=False
37
+ )
38
  return result
39
 
40