Senath commited on
Commit
7ce9df0
·
verified ·
1 Parent(s): f81d953

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -16
app.py CHANGED
@@ -18,39 +18,37 @@ def translate(text_input, audio_input, source_lang, target_lang, auto_detect):
18
  translated_text = None
19
  translated_audio = None
20
 
21
- # If text is provided
22
  if text_input:
23
  inputs = processor(text=text_input, src_lang=src, return_tensors="pt").to(device)
24
-
25
- # Generate speech
26
  speech = model.generate(**inputs, tgt_lang=target_lang)[0].cpu().numpy().squeeze()
 
27
 
28
- # Generate text
29
  text_tokens = model.generate(**inputs, tgt_lang=target_lang, generate_speech=False)
30
- translated_text = processor.decode(text_tokens[0].tolist()[0], skip_special_tokens=True)
31
-
32
- translated_audio = (16000, speech)
33
 
34
- # If audio is provided
35
  elif audio_input:
36
  waveform, sr = torchaudio.load(audio_input)
37
  waveform = torchaudio.functional.resample(waveform, sr, 16000)
38
  inputs = processor(audios=waveform, src_lang=src, return_tensors="pt").to(device)
39
 
40
- # Generate speech
41
  speech = model.generate(**inputs, tgt_lang=target_lang)[0].cpu().numpy().squeeze()
 
42
 
43
- # Generate text
44
  text_tokens = model.generate(**inputs, tgt_lang=target_lang, generate_speech=False)
45
- translated_text = processor.decode(text_tokens[0].tolist()[0], skip_special_tokens=True)
46
-
47
- translated_audio = (16000, speech)
48
 
49
  if translated_text or translated_audio:
50
  return translated_text or "", translated_audio
51
  return "No input provided.", None
52
 
53
- # Gradio UI
54
  iface = gr.Interface(
55
  fn=translate,
56
  inputs=[
@@ -67,6 +65,6 @@ iface = gr.Interface(
67
  title="iVoice Translate (Text + Speech)"
68
  ).queue()
69
 
70
- # Launch server
71
  if __name__ == "__main__":
72
- iface.launch(server_name="0.0.0.0", share=True, server_port=int(os.environ.get("PORT", 7860)))
 
18
  translated_text = None
19
  translated_audio = None
20
 
21
+ # If text input is provided
22
  if text_input:
23
  inputs = processor(text=text_input, src_lang=src, return_tensors="pt").to(device)
24
+
25
+ # Generate translated speech
26
  speech = model.generate(**inputs, tgt_lang=target_lang)[0].cpu().numpy().squeeze()
27
+ translated_audio = (16000, speech)
28
 
29
+ # Generate translated text
30
  text_tokens = model.generate(**inputs, tgt_lang=target_lang, generate_speech=False)
31
+ translated_text = processor.decode(text_tokens[0].tolist(), skip_special_tokens=True)
 
 
32
 
33
+ # If audio input is provided
34
  elif audio_input:
35
  waveform, sr = torchaudio.load(audio_input)
36
  waveform = torchaudio.functional.resample(waveform, sr, 16000)
37
  inputs = processor(audios=waveform, src_lang=src, return_tensors="pt").to(device)
38
 
39
+ # Generate translated speech
40
  speech = model.generate(**inputs, tgt_lang=target_lang)[0].cpu().numpy().squeeze()
41
+ translated_audio = (16000, speech)
42
 
43
+ # Generate translated text
44
  text_tokens = model.generate(**inputs, tgt_lang=target_lang, generate_speech=False)
45
+ translated_text = processor.decode(text_tokens[0].tolist(), skip_special_tokens=True)
 
 
46
 
47
  if translated_text or translated_audio:
48
  return translated_text or "", translated_audio
49
  return "No input provided.", None
50
 
51
+ # Gradio Interface
52
  iface = gr.Interface(
53
  fn=translate,
54
  inputs=[
 
65
  title="iVoice Translate (Text + Speech)"
66
  ).queue()
67
 
68
+ # Launch app
69
  if __name__ == "__main__":
70
+ iface.launch(server_name="0.0.0.0", share=True, server_port=int(os.environ.get("PORT", 7860)))