Spaces:
Sleeping
Sleeping
Ubuntu committed on
Commit ·
f201052
1
Parent(s): 115b19d
Process curly quotes
Browse files
app.py
CHANGED
|
@@ -11,7 +11,7 @@ def extract_dialogues_with_context_from_text(raw_text, context_window=1):
|
|
| 11 |
lines = [line.strip() for line in raw_text.splitlines() if line.strip()]
|
| 12 |
dialogue_data = []
|
| 13 |
for i, line in enumerate(lines):
|
| 14 |
-
quotes = re.findall(r'"([^"]+)"', line)
|
| 15 |
for quote in quotes:
|
| 16 |
context_lines = lines[max(0, i - context_window): i] + lines[i+1: i+1 + context_window]
|
| 17 |
context = " ".join(context_lines)
|
|
|
|
| 11 |
lines = [line.strip() for line in raw_text.splitlines() if line.strip()]
|
| 12 |
dialogue_data = []
|
| 13 |
for i, line in enumerate(lines):
|
| 14 |
+
quotes = re.findall(r'[“"]([^”"]+)[”"]', line)
|
| 15 |
for quote in quotes:
|
| 16 |
context_lines = lines[max(0, i - context_window): i] + lines[i+1: i+1 + context_window]
|
| 17 |
context = " ".join(context_lines)
|