roseyai JavaFXpert committed on
Commit
1a58232
·
0 Parent(s):

Duplicate from JavaFXpert/Chat-GPT-LangChain

Browse files

Co-authored-by: James Weaver <JavaFXpert@users.noreply.huggingface.co>

.gitattributes ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ *.mp4 filter=lfs diff=lfs merge=lfs -text
36
+ *.png filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: Chat GPT LangChain
3
+ emoji: 👀
4
+ colorFrom: red
5
+ colorTo: gray
6
+ sdk: gradio
7
+ sdk_version: 3.16.1
8
+ app_file: app.py
9
+ pinned: false
10
+ license: apache-2.0
11
+ duplicated_from: JavaFXpert/Chat-GPT-LangChain
12
+ ---
13
+
14
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
app.py ADDED
@@ -0,0 +1,629 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import io
2
+ import os
3
+ from contextlib import closing
4
+ from typing import Optional, Tuple
5
+ import datetime
6
+
7
+ import boto3
8
+ import gradio as gr
9
+ import requests
10
+
11
+ # UNCOMMENT TO USE WHISPER
12
+ # import warnings
13
+ # import whisper
14
+
15
+ from langchain import ConversationChain, LLMChain
16
+
17
+ from langchain.agents import load_tools, initialize_agent
18
+ from langchain.chains.conversation.memory import ConversationBufferMemory
19
+ from langchain.llms import OpenAI
20
+ from threading import Lock
21
+
22
+
23
+ # Console to variable
24
+ from io import StringIO
25
+ import sys
26
+ import re
27
+
28
+ from openai.error import AuthenticationError, InvalidRequestError, RateLimitError
29
+
30
+ # Pertains to Express-inator functionality
31
+ from langchain.prompts import PromptTemplate
32
+
33
+ from polly_utils import PollyVoiceData, NEURAL_ENGINE
34
+
35
# Credentials for the optional agent tools. Both are read with a plain
# subscript, so a missing variable raises KeyError at import time.
news_api_key = os.environ["NEWS_API_KEY"]
tmdb_bearer_token = os.environ["TMDB_BEARER_TOKEN"]

# Tools offered in the Settings tab, and the subset enabled by default.
TOOLS_LIST = [
    'serpapi',
    'wolfram-alpha',
    'google-search',
    'pal-math',
    'pal-colored-objects',
    'news-api',
    'tmdb-api',
    'open-meteo-api',
]
TOOLS_DEFAULT_LIST = ['serpapi', 'pal-math']

# User-facing messages and the completion length passed to the LLM.
BUG_FOUND_MSG = "Congratulations, you've found a bug in this application!"
AUTH_ERR_MSG = "Please paste your OpenAI key."
MAX_TOKENS = 512

# Pertains to Express-inator functionality: widget defaults and limits.
NUM_WORDS_DEFAULT = 0
MAX_WORDS = 400
FORMALITY_DEFAULT = "N/A"
TEMPERATURE_DEFAULT = 0.5
EMOTION_DEFAULT = "N/A"
TRANSLATE_TO_DEFAULT = "N/A"
LITERARY_STYLE_DEFAULT = "N/A"

# Each placeholder except original_words is either "" or a clause ending in
# ", ", which is why the template contains no separators of its own.
PROMPT_TEMPLATE = PromptTemplate(
    input_variables=[
        "original_words",
        "num_words",
        "formality",
        "emotions",
        "translate_to",
        "literary_style",
    ],
    template="Restate {num_words}{formality}{emotions}{translate_to}{literary_style}the following: \n{original_words}\n",
)

# Voice lookup table used when choosing an Amazon Polly voice.
POLLY_VOICE_DATA = PollyVoiceData()
59
+
60
+
61
+ # UNCOMMENT TO USE WHISPER
62
+ # warnings.filterwarnings("ignore")
63
+ # WHISPER_MODEL = whisper.load_model("tiny")
64
+ # print("WHISPER_MODEL", WHISPER_MODEL)
65
+
66
+
67
+ # UNCOMMENT TO USE WHISPER
68
+ # def transcribe(aud_inp):
69
+ # if aud_inp is None:
70
+ # return ""
71
+ # aud = whisper.load_audio(aud_inp)
72
+ # aud = whisper.pad_or_trim(aud)
73
+ # mel = whisper.log_mel_spectrogram(aud).to(WHISPER_MODEL.device)
74
+ # _, probs = WHISPER_MODEL.detect_language(mel)
75
+ #
76
+ # options = whisper.DecodingOptions()
77
+ # # options = whisper.DecodingOptions(language="ja")
78
+ #
79
+ # result = whisper.decode(WHISPER_MODEL, mel, options)
80
+ # print("result.text", result.text)
81
+ # result_text = ""
82
+ # if result and result.text:
83
+ # result_text = result.text
84
+ # return result_text
85
+
86
+
87
+ # Pertains to Express-inator functionality
88
def transform_text(desc, express_chain, num_words, formality,
                   anticipation_level, joy_level, trust_level,
                   fear_level, surprise_level, sadness_level, disgust_level, anger_level,
                   translate_to, literary_style):
    """Restate ``desc`` according to the Express-inator settings.

    Each setting contributes one clause (or nothing) to a "Restate ..."
    prompt. If at least one clause is present and ``express_chain`` is
    truthy, the chain is run to produce the restated text; otherwise
    ``desc`` is passed through untouched.

    Args:
        desc: Text to restate.
        express_chain: Object whose ``run`` accepts the prompt variables as a
            dict, or a falsy value to skip the transformation.
        num_words: Word limit; a falsy value or 0 means no limit.
        formality: Formality choice; "N/A" (any case) means none.
        anticipation_level ... anger_level: Emotion choices; "N/A" (any case)
            means the emotion is not requested.
        translate_to: Target language/style, or ``TRANSLATE_TO_DEFAULT``.
        literary_style: Literary style name, or ``LITERARY_STYLE_DEFAULT``.

    Returns:
        The resulting text with every newline doubled.
    """
    word_limit_clause = ""
    if num_words and int(num_words) != 0:
        word_limit_clause = "using up to " + str(num_words) + " words, "

    # Comparisons against "n/a" below are case-insensitive.
    formality = formality.lower()
    emotion_levels = [
        level.lower()
        for level in (anticipation_level, joy_level, trust_level, fear_level,
                      surprise_level, sadness_level, disgust_level, anger_level)
    ]

    formality_clause = ""
    if formality != "n/a":
        formality_clause = "in a " + formality + " manner, "

    # Keep only the emotions the user actually selected, in widget order.
    chosen_emotions = [level for level in emotion_levels if level != "n/a"]
    if not chosen_emotions:
        emotions_clause = ""
    elif len(chosen_emotions) == 1:
        emotions_clause = "with emotion of " + chosen_emotions[0] + ", "
    else:
        emotions_clause = ("with emotions of " + ", ".join(chosen_emotions[:-1])
                           + " and " + chosen_emotions[-1] + ", ")

    translation_clause = ""
    if translate_to != TRANSLATE_TO_DEFAULT:
        translation_clause = "translated to " + translate_to + ", "

    # Unknown style names contribute no clause.
    style_phrases = {
        "Prose": "as prose, ",
        "Summary": "as a summary, ",
        "Outline": "as an outline numbers and lower case letters, ",
        "Bullets": "as bullet points using bullets, ",
        "Poetry": "as a poem, ",
        "Haiku": "as a haiku, ",
        "Limerick": "as a limerick, ",
        "Joke": "as a very funny joke with a setup and punchline, ",
        "Knock-knock": "as a very funny knock-knock joke, ",
    }
    style_clause = ""
    if literary_style != LITERARY_STYLE_DEFAULT:
        style_clause = style_phrases.get(literary_style, "")

    # Rendered only for the log line below; the chain formats its own prompt.
    formatted_prompt = PROMPT_TEMPLATE.format(
        original_words=desc,
        num_words=word_limit_clause,
        formality=formality_clause,
        emotions=emotions_clause,
        translate_to=translation_clause,
        literary_style=style_clause
    )

    all_clauses = (word_limit_clause + formality_clause + emotions_clause
                   + translation_clause + style_clause)
    if express_chain and all_clauses.strip():
        prompt_vars = {
            'original_words': desc,
            'num_words': word_limit_clause,
            'formality': formality_clause,
            'emotions': emotions_clause,
            'translate_to': translation_clause,
            'literary_style': style_clause,
        }
        generated_text = express_chain.run(prompt_vars).strip()
    else:
        print("Not transforming text")
        generated_text = desc

    # Double every newline in the text that is returned.
    generated_text = generated_text.replace("\n", "\n\n")

    prompt_plus_generated = "GPT prompt: " + formatted_prompt + "\n\n" + generated_text

    # The timestamp is the local clock shifted back five hours.
    print("\n==== date/time: " + str(datetime.datetime.now() - datetime.timedelta(hours=5)) + " ====")
    print("prompt_plus_generated: " + prompt_plus_generated)

    return generated_text
190
+
191
+
192
def load_chain(tools_list, llm):
    """Build the conversational agent and the Express-inator chain.

    Args:
        tools_list: Tool names handed to ``load_tools``.
        llm: Language model shared by both chains; a falsy value means no
            model is available yet.

    Returns:
        ``(chain, express_chain)``, or ``(None, None)`` when ``llm`` is falsy.
    """
    if not llm:
        return None, None

    print("\ntools_list", tools_list)
    agent_tools = load_tools(tools_list, llm=llm, news_api_key=news_api_key,
                             tmdb_bearer_token=tmdb_bearer_token)

    # The agent keeps the running dialogue under the "chat_history" key.
    conversation_memory = ConversationBufferMemory(memory_key="chat_history")

    agent_chain = initialize_agent(agent_tools, llm, agent="conversational-react-description",
                                   verbose=True, memory=conversation_memory)
    restate_chain = LLMChain(llm=llm, prompt=PROMPT_TEMPLATE, verbose=True)

    return agent_chain, restate_chain
206
+
207
+
208
def set_openai_api_key(api_key):
    """Build the LLM and both chains for a user-supplied OpenAI key.

    The key is exported through ``OPENAI_API_KEY`` only while the objects are
    being constructed and is always blanked afterwards, including when
    construction raises, so a user's key never lingers in the process
    environment.

    Args:
        api_key: Candidate key. It is accepted only if it starts with "sk-"
            and is longer than 50 characters.

    Returns:
        ``(chain, express_chain, llm)`` for an accepted key, otherwise
        ``(None, None, None)``.
    """
    if not (api_key and api_key.startswith("sk-") and len(api_key) > 50):
        return None, None, None

    os.environ["OPENAI_API_KEY"] = api_key
    try:
        llm = OpenAI(temperature=0, max_tokens=MAX_TOKENS)
        chain, express_chain = load_chain(TOOLS_DEFAULT_LIST, llm)
    finally:
        # Clear the key even if building the LLM or the chains failed.
        os.environ["OPENAI_API_KEY"] = ""
    return chain, express_chain, llm
219
+
220
+
221
def _run_chain_safely(chain, inp):
    """Run ``chain`` on ``inp``, converting any failure into a message.

    Returns:
        ``(output, error_msg)``. On success ``output`` is the value returned
        by ``chain.run`` and ``error_msg`` is ``None``. On failure ``output``
        is ``""`` and ``error_msg`` is the user-facing description.
    """
    try:
        return chain.run(input=inp), None
    except AuthenticationError:
        return "", AUTH_ERR_MSG
    except RateLimitError as rle:
        return "", "\n\nRateLimitError: " + str(rle)
    except ValueError as ve:
        return "", "\n\nValueError: " + str(ve)
    except InvalidRequestError as ire:
        return "", "\n\nInvalidRequestError: " + str(ire)
    except Exception as e:
        return "", "\n\n" + BUG_FOUND_MSG + ":\n\n" + str(e)


def run_chain(chain, inp, capture_hidden_text):
    """Run the agent chain and optionally capture what it printed.

    Args:
        chain: Object exposing ``run(input=...)``.
        inp: The user's message.
        capture_hidden_text: When true, everything the chain writes to
            stdout is captured, cleaned up and returned as the second item.

    Returns:
        ``(output, hidden_text)``. Without capture, ``hidden_text`` is
        ``None`` and a failure is reported through ``output``. With capture,
        a failure leaves ``output`` empty and is appended to ``hidden_text``.
    """
    if not capture_hidden_text:
        output, error_msg = _run_chain_safely(chain, inp)
        return (output if error_msg is None else error_msg), None

    captured = StringIO()
    saved_stdout = sys.stdout
    sys.stdout = captured
    try:
        output, error_msg = _run_chain_safely(chain, inp)
    finally:
        # Always give stdout back, even for exceptions the helper does not
        # translate (e.g. KeyboardInterrupt).
        sys.stdout = saved_stdout
    hidden_text = captured.getvalue()

    # remove escape characters from hidden_text
    hidden_text = re.sub(r'\x1b[^m]*m', '', hidden_text)

    # remove "Entering new AgentExecutor chain..." from hidden_text
    hidden_text = re.sub(r"Entering new AgentExecutor chain...\n", "", hidden_text)

    # remove "Finished chain." from hidden_text
    hidden_text = re.sub(r"Finished chain.", "", hidden_text)

    # Put a blank line in front of each step label so the steps read as
    # separate paragraphs.
    for label in ("Thought:", "Action:", "Observation:", "Input:", "AI:"):
        hidden_text = re.sub(label, "\n\n" + label, hidden_text)

    if error_msg:
        hidden_text += error_msg

    print("hidden_text: ", hidden_text)
    return output, hidden_text
281
+
282
+
283
class ChatWrapper:
    """Callable used as the chat event handler; calls run one at a time."""

    def __init__(self):
        # Held for the whole of each __call__.
        self.lock = Lock()

    def __call__(
            self, api_key: str, inp: str, history: Optional[Tuple[str, str]], chain: Optional[ConversationChain],
            trace_chain: bool, speak_text: bool, express_chain: Optional[LLMChain],
            num_words, formality, anticipation_level, joy_level, trust_level,
            fear_level, surprise_level, sadness_level, disgust_level, anger_level,
            translate_to, literary_style
    ):
        """Execute the chat functionality.

        Runs the agent on ``inp`` when a chain exists, restates the answer
        through ``transform_text``, appends the exchange to ``history`` and,
        if ``speak_text`` is set, synthesizes audio for the answer.

        Returns:
            ``(history, history, html_audio, temp_aud_file, "")``; the
            trailing empty string is the new value of the message box.
        """
        with self.lock:
            print("\n==== date/time: " + str(datetime.datetime.now()) + " ====")
            print("inp: " + inp)
            print("trace_chain: ", trace_chain)
            print("speak_text: ", speak_text)
            history = history or []

            # If chain is None, that is because no API key was provided.
            output = "Please paste your OpenAI key to use this application."
            hidden_text = output

            if chain and chain != "":
                # Set OpenAI key
                import openai
                openai.api_key = api_key
                output, hidden_text = run_chain(chain, inp, capture_hidden_text=trace_chain)

            output = transform_text(output, express_chain, num_words, formality, anticipation_level, joy_level,
                                    trust_level, fear_level, surprise_level, sadness_level, disgust_level,
                                    anger_level, translate_to, literary_style)

            # With tracing enabled the captured text is shown above the answer.
            if trace_chain:
                text_to_display = hidden_text + "\n\n" + output
            else:
                text_to_display = output
            history.append((inp, text_to_display))

            # html_video, temp_file = do_html_video_speak(output)
            html_audio, temp_aud_file = None, None
            if speak_text:
                html_audio, temp_aud_file = do_html_audio_speak(output, translate_to)

        # return history, history, html_video, temp_file, ""
        return history, history, html_audio, temp_aud_file, ""


chat = ChatWrapper()
335
+
336
+
337
def do_html_audio_speak(words_to_speak, polly_language):
    """Synthesize ``words_to_speak`` with Amazon Polly and wrap it in HTML.

    A female voice for ``polly_language`` is looked up in
    ``POLLY_VOICE_DATA``; if none is found, the neural "Joanna" en-US voice
    is used. The MP3 is written to ``audios/tempfile.mp3``.

    Returns:
        ``(html_audio, "audios/tempfile.mp3")`` on success, or
        ``(None, None)`` when the response has no audio stream or the file
        cannot be written.
    """
    aws_session = boto3.Session(
        aws_access_key_id=os.environ["AWS_ACCESS_KEY_ID"],
        aws_secret_access_key=os.environ["AWS_SECRET_ACCESS_KEY"],
        region_name=os.environ["AWS_DEFAULT_REGION"]
    )
    polly_client = aws_session.client('polly')

    voice_id, language_code, engine = POLLY_VOICE_DATA.get_voice(polly_language, "Female")
    if not voice_id:
        voice_id, language_code, engine = "Joanna", "en-US", NEURAL_ENGINE

    response = polly_client.synthesize_speech(
        Text=words_to_speak,
        OutputFormat='mp3',
        VoiceId=voice_id,
        LanguageCode=language_code,
        Engine=engine
    )

    html_audio = '<pre>no audio</pre>'

    if "AudioStream" not in response:
        # The response didn't contain audio data, exit gracefully
        print("Could not stream audio")
        return None, None

    # Save the audio stream returned by Amazon Polly to the fixed temp file.
    with closing(response["AudioStream"]) as audio_stream:
        # output = os.path.join("/tmp/", "speech.mp3")
        try:
            with open('audios/tempfile.mp3', 'wb') as mp3_file:
                mp3_file.write(audio_stream.read())
            temp_aud_file = gr.File("audios/tempfile.mp3")
            temp_aud_file_url = "/file=" + temp_aud_file.value['name']
            html_audio = f'<audio autoplay><source src={temp_aud_file_url} type="audio/mp3"></audio>'
        except IOError as error:
            # Could not write to file, exit gracefully
            print(error)
            return None, None

    return html_audio, "audios/tempfile.mp3"
380
+
381
+
382
def do_html_video_speak(words_to_speak):
    """Request a lip-synced video of ``words_to_speak`` and wrap it in HTML.

    Posts the text to the exh.ai lipsync endpoint, authenticated with the
    ``EXHUMAN_API_KEY`` environment variable. The video is saved to
    ``videos/tempfile.mp4`` only when the request succeeded and returned a
    non-empty body, so an HTTP error payload is never stored as the video.

    Returns:
        ``(html_video, "videos/tempfile.mp4")``. ``html_video`` is the
        ``<video>`` markup on success and ``'<pre>no video</pre>'`` otherwise.
    """
    headers = {"Authorization": f"Bearer {os.environ['EXHUMAN_API_KEY']}"}
    body = {
        'bot_name': 'Masahiro',
        'bot_response': words_to_speak,
        'voice_name': 'Masahiro-EN'
    }
    api_endpoint = "https://api.exh.ai/animations/v1/generate_lipsync"
    res = requests.post(api_endpoint, json=body, headers=headers)

    html_video = '<pre>no video</pre>'
    # res.content is always bytes, so a type check cannot detect a failed
    # call; check the HTTP status and that a payload was returned.
    if res.ok and res.content:
        with open('videos/tempfile.mp4', 'wb') as f:
            f.write(res.content)
        temp_file = gr.File("videos/tempfile.mp4")
        temp_file_url = "/file=" + temp_file.value['name']
        html_video = f'<video width="256" height="256" autoplay><source src={temp_file_url} type="video/mp4" poster="Masahiro.png"></video>'
    else:
        print('video url unknown')
    return html_video, "videos/tempfile.mp4"
403
+
404
+
405
def update_selected_tools(widget, state, llm):
    """Rebuild both chains after the tool selection changes.

    Args:
        widget: Current tool selection; a falsy value keeps ``state``.
        state: Previously stored tool list.
        llm: Language model passed through to ``load_chain``.

    Returns:
        ``(tools, llm, chain, express_chain)`` for the matching state slots.
    """
    selected_tools = widget if widget else state
    chain, express_chain = load_chain(selected_tools, llm)
    return selected_tools, llm, chain, express_chain
410
+
411
+
412
def update_foo(widget, state):
    """Copy a widget's current value into its backing state.

    Falsy values are real selections: an unchecked checkbox sends ``False``
    and the word-limit slider sends ``0``. Only ``None`` (no value at all)
    keeps the previous state.

    Args:
        widget: Value reported by the widget.
        state: Previously stored value.

    Returns:
        ``widget`` unless it is ``None``, in which case ``state``.
    """
    if widget is not None:
        state = widget
    return state
416
+
417
+
418
# Builds the whole Gradio UI and wires its events, then launches the app.
# NOTE(review): the nesting of the layout containers below was reconstructed
# from a listing whose leading whitespace was stripped - confirm it against
# the deployed layout before relying on it.
with gr.Blocks(css=".gradio-container {background-color: lightgray}") as block:
    # Per-session state: the LLM, chat history and the two chains produced by
    # set_openai_api_key / update_selected_tools, plus the Settings values.
    llm_state = gr.State()
    history_state = gr.State()
    chain_state = gr.State()
    express_chain_state = gr.State()
    tools_list_state = gr.State(TOOLS_DEFAULT_LIST)
    trace_chain_state = gr.State(False)
    speak_text_state = gr.State(False)

    # Pertains to Express-inator functionality
    num_words_state = gr.State(NUM_WORDS_DEFAULT)
    formality_state = gr.State(FORMALITY_DEFAULT)
    anticipation_level_state = gr.State(EMOTION_DEFAULT)
    joy_level_state = gr.State(EMOTION_DEFAULT)
    trust_level_state = gr.State(EMOTION_DEFAULT)
    fear_level_state = gr.State(EMOTION_DEFAULT)
    surprise_level_state = gr.State(EMOTION_DEFAULT)
    sadness_level_state = gr.State(EMOTION_DEFAULT)
    disgust_level_state = gr.State(EMOTION_DEFAULT)
    anger_level_state = gr.State(EMOTION_DEFAULT)
    translate_to_state = gr.State(TRANSLATE_TO_DEFAULT)
    literary_style_state = gr.State(LITERARY_STYLE_DEFAULT)

    with gr.Tab("Chat"):
        with gr.Row():
            with gr.Column():
                gr.Markdown("<h4><center>Conversational Agent using GPT-3.5 & LangChain</center></h4>")

            openai_api_key_textbox = gr.Textbox(placeholder="Paste your OpenAI API key (sk-...)",
                                                show_label=False, lines=1, type='password')

        with gr.Row():
            # Hidden column holding the file/HTML components; audio_html and
            # tmp_aud_file are outputs of the chat handler wired below.
            with gr.Column(scale=1, min_width=100, visible=False):
                my_file = gr.File(label="Upload a file", type="file", visible=False)
                tmp_file = gr.File("videos/Masahiro.mp4", visible=False)
                tmp_file_url = "/file=" + tmp_file.value['name']
                htm_video = f'<video width="256" height="256" autoplay muted loop><source src={tmp_file_url} type="video/mp4" poster="Masahiro.png"></video>'
                video_html = gr.HTML(htm_video)

                # my_aud_file = gr.File(label="Audio file", type="file", visible=True)
                tmp_aud_file = gr.File("audios/tempfile.mp3", visible=False)
                tmp_aud_file_url = "/file=" + tmp_aud_file.value['name']
                htm_audio = f'<audio><source src={tmp_aud_file_url} type="audio/mp3"></audio>'
                audio_html = gr.HTML(htm_audio)

            with gr.Column(scale=3):
                chatbot = gr.Chatbot()

        with gr.Row():
            message = gr.Textbox(label="What's on your mind??",
                                 placeholder="What's the answer to life, the universe, and everything?",
                                 lines=1)
            submit = gr.Button(value="Send", variant="secondary").style(full_width=False)

        # UNCOMMENT TO USE WHISPER
        # with gr.Row():
        #     audio_comp = gr.Microphone(source="microphone", type="filepath", label="Just say it!",
        #                                interactive=True, streaming=False)
        #     audio_comp.change(transcribe, inputs=[audio_comp], outputs=[message])

        # Sample prompts; they are bound to the message box.
        gr.Examples(
            examples=["How many people live in Canada?",
                      "What is 2 to the 30th power?",
                      "How much did it rain in SF today?",
                      "Get me information about the movie 'Avatar'",
                      "What are the top tech headlines in the US?",
                      "On the desk, you see two blue booklets, two purple booklets, and two yellow pairs of sunglasses - "
                      "if I remove all the pairs of sunglasses from the desk, how many purple items remain on it?"],
            inputs=message
        )

    with gr.Tab("Settings"):
        # Changing the tool selection rebuilds both chains.
        tools_cb_group = gr.CheckboxGroup(label="Tools:", choices=TOOLS_LIST,
                                          value=TOOLS_DEFAULT_LIST)
        tools_cb_group.change(update_selected_tools,
                              inputs=[tools_cb_group, tools_list_state, llm_state],
                              outputs=[tools_list_state, llm_state, chain_state, express_chain_state])

        trace_chain_cb = gr.Checkbox(label="Show reasoning chain in chat bubble", value=False)
        trace_chain_cb.change(update_foo, inputs=[trace_chain_cb, trace_chain_state],
                              outputs=[trace_chain_state])

        speak_text_cb = gr.Checkbox(label="Speak text from agent", value=False)
        speak_text_cb.change(update_foo, inputs=[speak_text_cb, speak_text_state],
                             outputs=[speak_text_state])

    # Each tab below pairs a widget with a gr.State and uses update_foo to
    # copy the widget value into that state on change.
    with gr.Tab("Formality"):
        formality_radio = gr.Radio(label="Formality:",
                                   choices=[FORMALITY_DEFAULT, "Casual", "Polite", "Honorific"],
                                   value=FORMALITY_DEFAULT)
        formality_radio.change(update_foo,
                               inputs=[formality_radio, formality_state],
                               outputs=[formality_state])

    with gr.Tab("Translate to"):
        translate_to_radio = gr.Radio(label="Translate to:", choices=[
            TRANSLATE_TO_DEFAULT, "Arabic", "Arabic (Gulf)", "Catalan", "Chinese (Cantonese)", "Chinese (Mandarin)",
            "Danish", "Dutch", "English (Australian)", "English (British)", "English (Indian)", "English (New Zealand)",
            "English (South African)", "English (US)", "English (Welsh)", "Finnish", "French", "French (Canadian)",
            "German", "German (Austrian)", "Hindi", "Icelandic", "Indonesian", "Italian", "Japanese", "Korean", "Norwegian", "Polish",
            "Portuguese (Brazilian)", "Portuguese (European)", "Romanian", "Russian", "Spanish (European)",
            "Spanish (Mexican)", "Spanish (US)", "Swedish", "Turkish", "Ukrainian", "Welsh",
            "emojis", "Gen Z slang", "how the stereotypical Karen would say it", "Klingon",
            "Pirate", "Strange Planet expospeak technical talk", "Yoda"],
                                      value=TRANSLATE_TO_DEFAULT)

        translate_to_radio.change(update_foo,
                                  inputs=[translate_to_radio, translate_to_state],
                                  outputs=[translate_to_state])

    with gr.Tab("Lit style"):
        literary_style_radio = gr.Radio(label="Literary style:", choices=[
            LITERARY_STYLE_DEFAULT, "Prose", "Summary", "Outline", "Bullets", "Poetry", "Haiku", "Limerick", "Joke",
            "Knock-knock"],
                                        value=LITERARY_STYLE_DEFAULT)

        literary_style_radio.change(update_foo,
                                    inputs=[literary_style_radio, literary_style_state],
                                    outputs=[literary_style_state])

    with gr.Tab("Emotions"):
        # One radio per emotion family.
        anticipation_level_radio = gr.Radio(label="Anticipation level:",
                                            choices=[EMOTION_DEFAULT, "Interest", "Anticipation", "Vigilance"],
                                            value=EMOTION_DEFAULT)
        anticipation_level_radio.change(update_foo,
                                        inputs=[anticipation_level_radio, anticipation_level_state],
                                        outputs=[anticipation_level_state])

        joy_level_radio = gr.Radio(label="Joy level:",
                                   choices=[EMOTION_DEFAULT, "Serenity", "Joy", "Ecstasy"],
                                   value=EMOTION_DEFAULT)
        joy_level_radio.change(update_foo,
                               inputs=[joy_level_radio, joy_level_state],
                               outputs=[joy_level_state])

        trust_level_radio = gr.Radio(label="Trust level:",
                                     choices=[EMOTION_DEFAULT, "Acceptance", "Trust", "Admiration"],
                                     value=EMOTION_DEFAULT)
        trust_level_radio.change(update_foo,
                                 inputs=[trust_level_radio, trust_level_state],
                                 outputs=[trust_level_state])

        fear_level_radio = gr.Radio(label="Fear level:",
                                    choices=[EMOTION_DEFAULT, "Apprehension", "Fear", "Terror"],
                                    value=EMOTION_DEFAULT)
        fear_level_radio.change(update_foo,
                                inputs=[fear_level_radio, fear_level_state],
                                outputs=[fear_level_state])

        surprise_level_radio = gr.Radio(label="Surprise level:",
                                        choices=[EMOTION_DEFAULT, "Distraction", "Surprise", "Amazement"],
                                        value=EMOTION_DEFAULT)
        surprise_level_radio.change(update_foo,
                                    inputs=[surprise_level_radio, surprise_level_state],
                                    outputs=[surprise_level_state])

        sadness_level_radio = gr.Radio(label="Sadness level:",
                                       choices=[EMOTION_DEFAULT, "Pensiveness", "Sadness", "Grief"],
                                       value=EMOTION_DEFAULT)
        sadness_level_radio.change(update_foo,
                                   inputs=[sadness_level_radio, sadness_level_state],
                                   outputs=[sadness_level_state])

        disgust_level_radio = gr.Radio(label="Disgust level:",
                                       choices=[EMOTION_DEFAULT, "Boredom", "Disgust", "Loathing"],
                                       value=EMOTION_DEFAULT)
        disgust_level_radio.change(update_foo,
                                   inputs=[disgust_level_radio, disgust_level_state],
                                   outputs=[disgust_level_state])

        anger_level_radio = gr.Radio(label="Anger level:",
                                     choices=[EMOTION_DEFAULT, "Annoyance", "Anger", "Rage"],
                                     value=EMOTION_DEFAULT)
        anger_level_radio.change(update_foo,
                                 inputs=[anger_level_radio, anger_level_state],
                                 outputs=[anger_level_state])

    with gr.Tab("Max words"):
        num_words_slider = gr.Slider(label="Max number of words to generate (0 for don't care)",
                                     value=NUM_WORDS_DEFAULT, minimum=0, maximum=MAX_WORDS, step=10)
        num_words_slider.change(update_foo,
                                inputs=[num_words_slider, num_words_state],
                                outputs=[num_words_state])

    gr.HTML("""
    This application, developed by <a href='https://www.linkedin.com/in/javafxpert/'>James L. Weaver</a>,
    demonstrates a conversational agent implemented with OpenAI GPT-3.5 and LangChain.
    When necessary, it leverages tools for complex math, searching the internet, and accessing news and weather.""")

    gr.HTML("<center>Powered by <a href='https://github.com/hwchase17/langchain'>LangChain 🦜️🔗</a></center>")

    # Pressing Enter in the message box and clicking Send both call the same
    # handler with the same inputs and outputs. The input order must match
    # the parameter order of ChatWrapper.__call__.
    message.submit(chat, inputs=[openai_api_key_textbox, message, history_state, chain_state, trace_chain_state, speak_text_state,
                                 express_chain_state, num_words_state, formality_state,
                                 anticipation_level_state, joy_level_state, trust_level_state, fear_level_state,
                                 surprise_level_state, sadness_level_state, disgust_level_state, anger_level_state,
                                 translate_to_state, literary_style_state],
                   # outputs=[chatbot, history_state, video_html, my_file, message])
                   outputs=[chatbot, history_state, audio_html, tmp_aud_file, message])

    submit.click(chat, inputs=[openai_api_key_textbox, message, history_state, chain_state, trace_chain_state, speak_text_state,
                               express_chain_state, num_words_state, formality_state,
                               anticipation_level_state, joy_level_state, trust_level_state, fear_level_state,
                               surprise_level_state, sadness_level_state, disgust_level_state, anger_level_state,
                               translate_to_state, literary_style_state],
                 # outputs=[chatbot, history_state, video_html, my_file, message])
                 outputs=[chatbot, history_state, audio_html, tmp_aud_file, message])

    # Every edit of the key box rebuilds the chains and the LLM.
    openai_api_key_textbox.change(set_openai_api_key,
                                  inputs=[openai_api_key_textbox],
                                  outputs=[chain_state, express_chain_state, llm_state])

# Runs at import time: starts the Gradio server in debug mode.
block.launch(debug=True)
audios/tempfile.mp3 ADDED
Binary file (35.2 kB). View file
 
images/Masahiro.png ADDED

Git LFS Details

  • SHA256: 215bfaa1bdb0ee4852988b29d480e2d1c2d9669eaa907ba25cc2d3dfa6ebfa4e
  • Pointer size: 132 Bytes
  • Size of remote file: 4.39 MB
polly_utils.py ADDED
@@ -0,0 +1,635 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # This class stores Polly voice data. Specifically, the class stores several records containing
2
+ # language, lang_code, gender, voice_id and engine. The class also has a method to return the
3
+ # voice_id, lang_code and engine given a language and gender.
4
+
5
# Engine names returned by PollyVoiceData.get_voice().
NEURAL_ENGINE = "neural"
STANDARD_ENGINE = "standard"


class PollyVoiceData:
    """In-memory table of Polly voices with simple lookup helpers.

    Each entry of ``voice_data`` is a dict with the keys ``language``,
    ``lang_code``, ``whisper_lang_code``, ``voice_id``, ``gender``,
    ``neural`` and ``standard``; the last two hold ``'Yes'`` or ``'No'``.
    """

    def __init__(self):
        """Populate ``self.voice_data`` with one dict per known voice."""
        columns = ('language', 'lang_code', 'whisper_lang_code',
                   'voice_id', 'gender', 'neural', 'standard')
        # One row per voice, in the same order as ``columns``.
        rows = (
            ('Arabic', 'arb', 'ar', 'Zeina', 'Female', 'No', 'Yes'),
            ('Arabic (Gulf)', 'ar-AE', 'ar', 'Hala', 'Female', 'Yes', 'No'),
            ('Catalan', 'ca-ES', 'ca', 'Arlet', 'Female', 'Yes', 'No'),
            ('Chinese (Cantonese)', 'yue-CN', 'zh', 'Hiujin', 'Female', 'Yes', 'No'),
            ('Chinese (Mandarin)', 'cmn-CN', 'zh', 'Zhiyu', 'Female', 'Yes', 'No'),
            ('Danish', 'da-DK', 'da', 'Naja', 'Female', 'No', 'Yes'),
            ('Danish', 'da-DK', 'da', 'Mads', 'Male', 'No', 'Yes'),
            ('Dutch', 'nl-NL', 'nl', 'Laura', 'Female', 'Yes', 'No'),
            ('Dutch', 'nl-NL', 'nl', 'Lotte', 'Female', 'No', 'Yes'),
            ('Dutch', 'nl-NL', 'nl', 'Ruben', 'Male', 'No', 'Yes'),
            ('English (Australian)', 'en-AU', 'en', 'Nicole', 'Female', 'No', 'Yes'),
            ('English (Australian)', 'en-AU', 'en', 'Olivia', 'Female', 'Yes', 'No'),
            ('English (Australian)', 'en-AU', 'en', 'Russell', 'Male', 'No', 'Yes'),
            ('English (British)', 'en-GB', 'en', 'Amy', 'Female', 'Yes', 'Yes'),
            ('English (British)', 'en-GB', 'en', 'Emma', 'Female', 'Yes', 'Yes'),
            ('English (British)', 'en-GB', 'en', 'Brian', 'Male', 'Yes', 'Yes'),
            ('English (British)', 'en-GB', 'en', 'Arthur', 'Male', 'Yes', 'No'),
            ('English (Indian)', 'en-IN', 'en', 'Aditi', 'Female', 'No', 'Yes'),
            ('English (Indian)', 'en-IN', 'en', 'Raveena', 'Female', 'No', 'Yes'),
            ('English (Indian)', 'en-IN', 'en', 'Kajal', 'Female', 'Yes', 'No'),
            ('English (New Zealand)', 'en-NZ', 'en', 'Aria', 'Female', 'Yes', 'No'),
            ('English (South African)', 'en-ZA', 'en', 'Ayanda', 'Female', 'Yes', 'No'),
            ('English (US)', 'en-US', 'en', 'Ivy', 'Female (child)', 'Yes', 'Yes'),
            ('English (US)', 'en-US', 'en', 'Joanna', 'Female', 'Yes', 'Yes'),
            ('English (US)', 'en-US', 'en', 'Kendra', 'Female', 'Yes', 'Yes'),
            ('English (US)', 'en-US', 'en', 'Kimberly', 'Female', 'Yes', 'Yes'),
            ('English (US)', 'en-US', 'en', 'Salli', 'Female', 'Yes', 'Yes'),
            ('English (US)', 'en-US', 'en', 'Joey', 'Male', 'Yes', 'Yes'),
            ('English (US)', 'en-US', 'en', 'Justin', 'Male (child)', 'Yes', 'Yes'),
            ('English (US)', 'en-US', 'en', 'Kevin', 'Male (child)', 'Yes', 'No'),
            ('English (US)', 'en-US', 'en', 'Matthew', 'Male', 'Yes', 'Yes'),
            ('English (Welsh)', 'en-GB-WLS', 'en', 'Geraint', 'Male', 'No', 'Yes'),
            ('Finnish', 'fi-FI', 'fi', 'Suvi', 'Female', 'Yes', 'No'),
            ('French', 'fr-FR', 'fr', 'Celine', 'Female', 'No', 'Yes'),
            ('French', 'fr-FR', 'fr', 'Lea', 'Female', 'Yes', 'Yes'),
            ('French', 'fr-FR', 'fr', 'Mathieu', 'Male', 'No', 'Yes'),
            ('French (Canadian)', 'fr-CA', 'fr', 'Chantal', 'Female', 'No', 'Yes'),
            ('French (Canadian)', 'fr-CA', 'fr', 'Gabrielle', 'Female', 'Yes', 'No'),
            ('French (Canadian)', 'fr-CA', 'fr', 'Liam', 'Male', 'Yes', 'No'),
            ('German', 'de-DE', 'de', 'Marlene', 'Female', 'No', 'Yes'),
            ('German', 'de-DE', 'de', 'Vicki', 'Female', 'Yes', 'Yes'),
            ('German', 'de-DE', 'de', 'Hans', 'Male', 'No', 'Yes'),
            ('German', 'de-DE', 'de', 'Daniel', 'Male', 'Yes', 'No'),
            ('German (Austrian)', 'de-AT', 'de', 'Hannah', 'Female', 'Yes', 'No'),
            ('Hindi', 'hi-IN', 'hi', 'Aditi', 'Female', 'No', 'Yes'),
            ('Hindi', 'hi-IN', 'hi', 'Kajal', 'Female', 'Yes', 'No'),
            ('Icelandic', 'is-IS', 'is', 'Dora', 'Female', 'No', 'Yes'),
            ('Icelandic', 'is-IS', 'is', 'Karl', 'Male', 'No', 'Yes'),
            ('Italian', 'it-IT', 'it', 'Carla', 'Female', 'No', 'Yes'),
            ('Italian', 'it-IT', 'it', 'Bianca', 'Female', 'Yes', 'Yes'),
            ('Japanese', 'ja-JP', 'ja', 'Mizuki', 'Female', 'No', 'Yes'),
            ('Japanese', 'ja-JP', 'ja', 'Takumi', 'Male', 'Yes', 'Yes'),
            ('Korean', 'ko-KR', 'ko', 'Seoyeon', 'Female', 'Yes', 'Yes'),
            ('Norwegian', 'nb-NO', 'no', 'Liv', 'Female', 'No', 'Yes'),
            ('Norwegian', 'nb-NO', 'no', 'Ida', 'Female', 'Yes', 'No'),
            ('Polish', 'pl-PL', 'pl', 'Ewa', 'Female', 'No', 'Yes'),
            ('Polish', 'pl-PL', 'pl', 'Maja', 'Female', 'No', 'Yes'),
            ('Polish', 'pl-PL', 'pl', 'Jacek', 'Male', 'No', 'Yes'),
            ('Polish', 'pl-PL', 'pl', 'Jan', 'Male', 'No', 'Yes'),
            ('Polish', 'pl-PL', 'pl', 'Ola', 'Female', 'Yes', 'No'),
            ('Portuguese (Brazilian)', 'pt-BR', 'pt', 'Camila', 'Female', 'Yes', 'Yes'),
            ('Portuguese (Brazilian)', 'pt-BR', 'pt', 'Vitoria', 'Female', 'Yes', 'Yes'),
            ('Portuguese (Brazilian)', 'pt-BR', 'pt', 'Ricardo', 'Male', 'No', 'Yes'),
            ('Portuguese (European)', 'pt-PT', 'pt', 'Ines', 'Female', 'Yes', 'Yes'),
            ('Portuguese (European)', 'pt-PT', 'pt', 'Cristiano', 'Male', 'No', 'Yes'),
            ('Romanian', 'ro-RO', 'ro', 'Carmen', 'Female', 'No', 'Yes'),
            ('Russian', 'ru-RU', 'ru', 'Tatyana', 'Female', 'No', 'Yes'),
            ('Russian', 'ru-RU', 'ru', 'Maxim', 'Male', 'No', 'Yes'),
            ('Spanish (European)', 'es-ES', 'es', 'Conchita', 'Female', 'No', 'Yes'),
            ('Spanish (European)', 'es-ES', 'es', 'Lucia', 'Female', 'Yes', 'Yes'),
            ('Spanish (European)', 'es-ES', 'es', 'Enrique', 'Male', 'No', 'Yes'),
            ('Spanish (Mexican)', 'es-MX', 'es', 'Mia', 'Female', 'Yes', 'Yes'),
            ('Spanish (US)', 'es-US', 'es', 'Lupe', 'Female', 'Yes', 'Yes'),
            ('Spanish (US)', 'es-US', 'es', 'Penelope', 'Female', 'No', 'Yes'),
            ('Spanish (US)', 'es-US', 'es', 'Miguel', 'Male', 'No', 'Yes'),
            ('Spanish (US)', 'es-US', 'es', 'Pedro', 'Male', 'Yes', 'No'),
            ('Swedish', 'sv-SE', 'sv', 'Astrid', 'Female', 'No', 'Yes'),
            ('Swedish', 'sv-SE', 'sv', 'Elin', 'Female', 'Yes', 'No'),
            ('Turkish', 'tr-TR', 'tr', 'Filiz', 'Female', 'No', 'Yes'),
            ('Welsh', 'cy-GB', 'cy', 'Gwyneth', 'Female', 'No', 'Yes'),
        )
        self.voice_data = [dict(zip(columns, row)) for row in rows]

    def get_voice(self, language, gender):
        """Return ``(voice_id, lang_code, engine)`` for a language and gender.

        The table is scanned for the first entry whose ``language`` and
        ``gender`` match exactly and that supports the neural engine; if
        there is none, it is scanned again for the first match that supports
        the standard engine. ``(None, None, None)`` is returned when neither
        scan finds a voice.
        """
        # Neural is tried across the whole table before standard is considered.
        preference = (('neural', NEURAL_ENGINE), ('standard', STANDARD_ENGINE))
        for flag, engine in preference:
            for entry in self.voice_data:
                if entry['language'] != language or entry['gender'] != gender:
                    continue
                if entry[flag] == 'Yes':
                    return entry['voice_id'], entry['lang_code'], engine
        return None, None, None

    def get_whisper_lang_code(self, language):
        """Return the ``whisper_lang_code`` of the first entry for ``language``.

        Falls back to ``"en"`` when no entry has that language.
        """
        codes = (entry['whisper_lang_code']
                 for entry in self.voice_data
                 if entry['language'] == language)
        return next(codes, "en")
590
+
591
+
592
+ # Run from the command-line
593
if __name__ == '__main__':
    # Manual smoke test: print the voice chosen for a few language/gender
    # pairs, then the Whisper language code for a few languages.
    polly_voice_data = PollyVoiceData()

    voice_queries = (
        ('English (US)', 'Male'),
        ('English (US)', 'Female'),
        ('French', 'Female'),
        ('French', 'Male'),
        ('Japanese', 'Female'),
        ('Japanese', 'Male'),
        ('Hindi', 'Female'),
        ('Hindi', 'Male'),
    )
    for language, gender in voice_queries:
        voice_id, language_code, engine = polly_voice_data.get_voice(language, gender)
        print(language, gender, voice_id, language_code, engine)

    # 'Foo' is not in the table and exercises the "en" fallback.
    for language in ('English (US)', 'Chinese (Mandarin)', 'Norwegian', 'Dutch', 'Foo'):
        whisper_lang_code = polly_voice_data.get_whisper_lang_code(language)
        print(f'{language} whisper_lang_code:', whisper_lang_code)
634
+
635
+
requirements.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ openai==0.26.1
2
+ gradio==3.16.2
3
+ google-search-results
4
+ google-api-python-client==2.72.0
5
+ wolframalpha
6
+ langchain==0.0.63
7
+ requests==2.28.2
8
+ git+https://github.com/openai/whisper.git
9
+ boto3
videos/Masahiro.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca886517414fae8bcea5a5130ae1d01ef3ead7aed437203abebf032217fd0be6
3
+ size 2425212
videos/tempfile.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80aa42c48e322cc8da957e8d2e2aba7f1cd5675abb998146facf83a279a1c07d
3
+ size 80784