Update app.py
Browse files
app.py
CHANGED
|
@@ -17,9 +17,10 @@ if check_password():
|
|
| 17 |
initial_base_prompt = os.getenv('BASE_PROMPT')
|
| 18 |
initial_processing_prompt = os.getenv('PROCCESS_PROMPT')
|
| 19 |
|
|
|
|
|
|
|
| 20 |
llm = st.sidebar.selectbox("LLM", ["GigaChat", "Chat GPT"], index=0)
|
| 21 |
base_prompt = st.sidebar.text_area("Промпт для резюмирования", value=initial_base_prompt)
|
| 22 |
-
max_tokens_summary = st.sidebar.number_input("Максимальное количество токенов при резюмировании", min_value=1, value=1024)
|
| 23 |
|
| 24 |
enable_processing = st.sidebar.checkbox("Добавить обработку транскрибации", value=False)
|
| 25 |
processing_prompt = st.sidebar.text_area("Промпт для обработки транскрибации", value=initial_processing_prompt)
|
|
@@ -63,7 +64,7 @@ if check_password():
|
|
| 63 |
print('Aligned, now diarizing')
|
| 64 |
|
| 65 |
diarize_model = whisperx.DiarizationPipeline(use_auth_token=st.secrets["HF_TOKEN"], device=device)
|
| 66 |
-
diarize_segments = diarize_model(audio)
|
| 67 |
result_diar = whisperx.assign_word_speakers(diarize_segments, result)
|
| 68 |
|
| 69 |
transcript = convert_segments_object_to_text_simple(result_diar)
|
|
@@ -93,9 +94,9 @@ if check_password():
|
|
| 93 |
|
| 94 |
with st.spinner('Резюмируем...'):
|
| 95 |
if (llm == 'GigaChat'):
|
| 96 |
-
summary_answer = get_completion_from_gigachat(base_prompt + transcript, max_tokens_summary, access_token)
|
| 97 |
elif (llm == 'Chat GPT'):
|
| 98 |
-
summary_answer = get_completion_from_openai(base_prompt + transcript, max_tokens_summary)
|
| 99 |
|
| 100 |
st.write("Результат резюмирования:")
|
| 101 |
st.text(summary_answer)
|
|
|
|
| 17 |
initial_base_prompt = os.getenv('BASE_PROMPT')
|
| 18 |
initial_processing_prompt = os.getenv('PROCCESS_PROMPT')
|
| 19 |
|
| 20 |
+
min_speakers = st.sidebar.number_input("Минимальное количество спикеров", min_value=1, value=2)
|
| 21 |
+
max_speakers = st.sidebar.number_input("Максимальное количество спикеров", min_value=1, value=2)
|
| 22 |
llm = st.sidebar.selectbox("LLM", ["GigaChat", "Chat GPT"], index=0)
|
| 23 |
base_prompt = st.sidebar.text_area("Промпт для резюмирования", value=initial_base_prompt)
|
|
|
|
| 24 |
|
| 25 |
enable_processing = st.sidebar.checkbox("Добавить обработку транскрибации", value=False)
|
| 26 |
processing_prompt = st.sidebar.text_area("Промпт для обработки транскрибации", value=initial_processing_prompt)
|
|
|
|
| 64 |
print('Aligned, now diarizing')
|
| 65 |
|
| 66 |
diarize_model = whisperx.DiarizationPipeline(use_auth_token=st.secrets["HF_TOKEN"], device=device)
|
| 67 |
+
diarize_segments = diarize_model(audio, min_speakers=min_speakers, max_speakers=max_speakers)
|
| 68 |
result_diar = whisperx.assign_word_speakers(diarize_segments, result)
|
| 69 |
|
| 70 |
transcript = convert_segments_object_to_text_simple(result_diar)
|
|
|
|
| 94 |
|
| 95 |
with st.spinner('Резюмируем...'):
|
| 96 |
if (llm == 'GigaChat'):
|
| 97 |
+
summary_answer = get_completion_from_gigachat(base_prompt + transcript, 1024, access_token)
|
| 98 |
elif (llm == 'Chat GPT'):
|
| 99 |
+
summary_answer = get_completion_from_openai(base_prompt + transcript, 1024)
|
| 100 |
|
| 101 |
st.write("Результат резюмирования:")
|
| 102 |
st.text(summary_answer)
|