Update process_interview.py
Browse files - process_interview.py +2 -1
process_interview.py
CHANGED
|
@@ -157,7 +157,8 @@ def identify_speakers(transcript: Dict, wav_file_path: str) -> List[Dict]:
|
|
| 157 |
'speaker_name': match['metadata'].get('speaker_name', 'Unknown Speaker')}
|
| 158 |
else:
|
| 159 |
speaker_id = f"speaker_{uuid.uuid4().hex[:8]}"
|
| 160 |
-
|
|
|
|
| 161 |
index.upsert(vectors=[(speaker_id, embedding, {"speaker_name": speaker_name})])
|
| 162 |
return {**utterance, 'speaker_id': speaker_id, 'speaker_name': speaker_name}
|
| 163 |
|
|
|
|
| 157 |
'speaker_name': match['metadata'].get('speaker_name', 'Unknown Speaker')}
|
| 158 |
else:
|
| 159 |
speaker_id = f"speaker_{uuid.uuid4().hex[:8]}"
|
| 160 |
+
vector_count = index.describe_index_stats()['namespaces'].get('default', {}).get('vector_count', 0)
|
| 161 |
+
speaker_name = f"Speaker {vector_count + 1 if vector_count >= 0 else 1}"
|
| 162 |
index.upsert(vectors=[(speaker_id, embedding, {"speaker_name": speaker_name})])
|
| 163 |
return {**utterance, 'speaker_id': speaker_id, 'speaker_name': speaker_name}
|
| 164 |
|