Spanicin committed on
Commit
840ea2e
·
verified ·
1 Parent(s): ea7ec3a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -290,7 +290,7 @@ def run_preprocessing(args):
290
  # return cleaned_text.strip()
291
 
292
  def extract_content(data):
293
- pattern = r'"content":"(.*?)"'
294
  match = re.search(pattern, data)
295
  if match:
296
  return match.group(1)
 
290
  # return cleaned_text.strip()
291
 
292
  def extract_content(data):
293
+ pattern = r'"content":"((?:\\.|[^"\\])*)"'
294
  match = re.search(pattern, data)
295
  if match:
296
  return match.group(1)