File size: 8,042 Bytes
f09eba4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
# app_fixed.py
import gradio as gr
import os
import time
import datetime
import config

# Import modules with error handling
try:
    from modules.tts_handler import text_to_speech_file
    from modules.stt_handler import transcribe_audio
    from modules.doc_processor import extract_text_from_document
    from modules.llm_handler import generate_question, evaluate_answer
    from modules.report_generator import generate_pdf_report
    TTS_AVAILABLE = True
except ImportError as e:
    print(f"Warning: Some modules could not be imported: {e}")
    TTS_AVAILABLE = False

def start_interview(interview_type, doc_file, name, num_questions):
    if not interview_type or not doc_file:
        return (
            {},  # state
            [["System", "Please select an interview type and upload a document to begin."]],  # chatbot
            None,  # audio_out
            gr.update(interactive=False),  # audio_in
            gr.update(interactive=True)   # start_btn
        )
    
    try:
        doc_text = extract_text_from_document(doc_file.name)
        if "Error" in doc_text or "Unsupported" in doc_text:
            return (
                {},
                [["System", f"Error: {doc_text}"]],
                None,
                gr.update(interactive=False),
                gr.update(interactive=True)
            )
        
        initial_state = {
            "interview_type": interview_type,
            "doc_text": doc_text,
            "name": name if name else "User",
            "question_count": int(num_questions),
            "current_question_num": 1,
            "interview_log": [],
            "start_time": time.time()
        }
        
        first_question = generate_question(interview_type, doc_text)
        initial_state["current_question_text"] = first_question
        greeting = f"Hello {initial_state['name']}. We'll go through {int(num_questions)} questions today. Here is your first question:"
        
        # Try to generate TTS audio, but don't fail if it's not available
        ai_voice_path = None
        if TTS_AVAILABLE:
            try:
                tts_prompt = f"{greeting} {first_question}"
                ai_voice_path = text_to_speech_file(tts_prompt)
            except Exception as e:
                print(f"TTS generation failed: {e}")
        
        return (
            initial_state,
            [["System", f"{greeting}\n\n{first_question}"]],
            ai_voice_path,
            gr.update(interactive=True),
            gr.update(interactive=False)
        )
        
    except Exception as e:
        return (
            {},
            [["System", f"An error occurred: {str(e)}"]],
            None,
            gr.update(interactive=False),
            gr.update(interactive=True)
        )

def handle_interview_turn(user_audio, chatbot_history, current_state):
    if not current_state or not user_audio:
        return current_state, chatbot_history, None, gr.update(interactive=True), gr.update(visible=False)
    
    try:
        user_answer_text = transcribe_audio(user_audio)
        new_history = chatbot_history + [[user_answer_text, None]]
        
        evaluation_text = evaluate_answer(current_state["current_question_text"], user_answer_text)
        current_state["interview_log"].append({
            "question": current_state["current_question_text"],
            "answer": user_answer_text,
            "evaluation": evaluation_text
        })
        
        if current_state["current_question_num"] >= current_state["question_count"]:
            end_message = "This concludes the interview. Generating your final report now."
            final_history = new_history + [["System", end_message]]
            
            # Generate PDF
            pdf_path = generate_pdf_file(current_state)
            
            # Try TTS
            ai_voice_path = None
            if TTS_AVAILABLE:
                try:
                    ai_voice_path = text_to_speech_file(end_message)
                except Exception as e:
                    print(f"TTS generation failed: {e}")
            
            return (
                current_state,
                final_history,
                ai_voice_path,
                gr.update(interactive=False),
                gr.update(value=pdf_path, visible=True)
            )
        else:
            current_state["current_question_num"] += 1
            next_question = generate_question(current_state["interview_type"], current_state["doc_text"])
            current_state["current_question_text"] = next_question
            q_num = current_state["current_question_num"]
            transition_message = f"Thank you. Here is question {q_num}:\n\n{next_question}"
            final_history = new_history + [["System", transition_message]]
            
            # Try TTS
            ai_voice_path = None
            if TTS_AVAILABLE:
                try:
                    ai_voice_path = text_to_speech_file(transition_message)
                except Exception as e:
                    print(f"TTS generation failed: {e}")
            
            return (
                current_state,
                final_history,
                ai_voice_path,
                gr.update(interactive=True),
                gr.update(visible=False)
            )
            
    except Exception as e:
        error_history = chatbot_history + [["System", f"An error occurred: {str(e)}"]]
        return current_state, error_history, None, gr.update(interactive=True), gr.update(visible=False)

def generate_pdf_file(state):
    try:
        total_duration_minutes = (time.time() - state.get("start_time", time.time())) / 60
        final_data = { 
            "name": state.get("name", "N/A"), 
            "type": state.get("interview_type", "N/A"), 
            "duration": total_duration_minutes,
            "q_and_a": state.get("interview_log", [])
        }
        file_name = f"Report_{state.get('name', 'User')}_{datetime.datetime.now().strftime('%Y-%m-%d')}.pdf"
        file_path = os.path.join(config.REPORT_FOLDER, file_name)
        generate_pdf_report(final_data, file_path)
        return file_path
    except Exception as e:
        print(f"PDF generation failed: {e}")
        return None

with gr.Blocks(theme=gr.themes.Default()) as app:
    state = gr.State(value={})
    
    gr.Markdown("# PM Interview Coach")
    
    with gr.Row():
        with gr.Column(scale=1):
            gr.Markdown("### Setup")
            user_name = gr.Textbox(label="Your Name", placeholder="Enter your name")
            interview_type_dd = gr.Dropdown(choices=config.INTERVIEW_TYPES, label="Interview Type")
            num_questions_slider = gr.Slider(minimum=1, maximum=10, value=5, step=1, label="Number of Questions")
            doc_uploader = gr.File(label="Upload Resume/CV (.pdf, .docx)", file_types=['.pdf', '.docx'])
            start_btn = gr.Button("Start Interview", variant="primary")
        
        with gr.Column(scale=2):
            chatbot = gr.Chatbot(label="Conversation", height=500)
            audio_in = gr.Audio(sources=["microphone"], type="filepath", label="Record Your Answer", interactive=False)
            audio_out = gr.Audio(visible=False, autoplay=True)
            download_pdf_btn = gr.File(label="Download Report", visible=False)

    # Event handlers
    start_btn.click(
        fn=start_interview,
        inputs=[interview_type_dd, doc_uploader, user_name, num_questions_slider],
        outputs=[state, chatbot, audio_out, audio_in, start_btn]
    )
    
    audio_in.stop_recording(
        fn=handle_interview_turn,
        inputs=[audio_in, chatbot, state],
        outputs=[state, chatbot, audio_out, audio_in, download_pdf_btn]
    )

if __name__ == "__main__":
    # Create necessary directories
    os.makedirs(config.UPLOAD_FOLDER, exist_ok=True)
    os.makedirs(config.REPORT_FOLDER, exist_ok=True)
    
    # Launch the app
    app.launch(
        server_name="0.0.0.0",
        server_port=7860,
        share=False
    )