Ubuntu committed on
Commit
f201052
·
1 Parent(s): 115b19d

Process curly quotes

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -11,7 +11,7 @@ def extract_dialogues_with_context_from_text(raw_text, context_window=1):
11
  lines = [line.strip() for line in raw_text.splitlines() if line.strip()]
12
  dialogue_data = []
13
  for i, line in enumerate(lines):
14
- quotes = re.findall(r'"([^"]+)"', line)
15
  for quote in quotes:
16
  context_lines = lines[max(0, i - context_window): i] + lines[i+1: i+1 + context_window]
17
  context = " ".join(context_lines)
 
11
  lines = [line.strip() for line in raw_text.splitlines() if line.strip()]
12
  dialogue_data = []
13
  for i, line in enumerate(lines):
14
+ quotes = re.findall(r'[“"]([^"]+)[”"]', line)
15
  for quote in quotes:
16
  context_lines = lines[max(0, i - context_window): i] + lines[i+1: i+1 + context_window]
17
  context = " ".join(context_lines)