unijoh committed on
Commit
3711ce8
·
verified ·
1 Parent(s): 05312f4

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +24 -6
app.py CHANGED
@@ -670,23 +670,41 @@ def _write_tsv(df: pd.DataFrame, filename: str) -> str:
670
  return path
671
 
672
  def build_download_main(rows_state) -> str:
673
- """TSV with 2 columns: Faroese analysis, then English analysis."""
674
- fo_vals, en_vals = [], []
 
 
675
  for r in (rows_state or []):
676
  vec = torch.tensor(r["vec"])
 
 
 
677
  fo_vals.append(analysis_text(vec, "fo"))
678
  en_vals.append(analysis_text(vec, "en"))
679
- df = pd.DataFrame({UI["fo"]["s"]: fo_vals, UI["en"]["s"]: en_vals})
 
 
 
 
 
 
680
  return _write_tsv(df, "Markað.tsv")
681
 
682
  def build_download_expanded(rows_state, lang: str) -> str:
683
- """TSV with the Expanded tags column in the currently selected UI language."""
684
  lang = "fo" if lang == "fo" else "en"
685
- vals = []
686
  for r in (rows_state or []):
687
  vec = torch.tensor(r["vec"])
 
 
 
688
  vals.append(expanded_text(vec, lang))
689
- df = pd.DataFrame({UI[lang]["m"]: vals})
 
 
 
 
690
  return _write_tsv(df, "Markað_útgreinað.tsv")
691
 
692
  with gr.Blocks(css=CSS, title="Marka") as demo:
 
670
  return path
671
 
672
  def build_download_main(rows_state) -> str:
673
+ """TSV with 4 columns:
674
+ Orð, Mark, Útgreining (FO), Analysis (EN)
675
+ """
676
+ words, tags, fo_vals, en_vals = [], [], [], []
677
  for r in (rows_state or []):
678
  vec = torch.tensor(r["vec"])
679
+ tag = vector_to_tag(vec)
680
+ words.append(r["word"])
681
+ tags.append(tag)
682
  fo_vals.append(analysis_text(vec, "fo"))
683
  en_vals.append(analysis_text(vec, "en"))
684
+
685
+ df = pd.DataFrame({
686
+ UI["fo"]["w"]: words,
687
+ UI["fo"]["t"]: tags,
688
+ UI["fo"]["s"]: fo_vals,
689
+ UI["en"]["s"]: en_vals,
690
+ })
691
  return _write_tsv(df, "Markað.tsv")
692
 
693
  def build_download_expanded(rows_state, lang: str) -> str:
694
+ """TSV with 3 columns: Word/Orð, Tag/Mark, and Expanded tags in the UI language."""
695
  lang = "fo" if lang == "fo" else "en"
696
+ words, tags, vals = [], [], []
697
  for r in (rows_state or []):
698
  vec = torch.tensor(r["vec"])
699
+ tag = vector_to_tag(vec)
700
+ words.append(r["word"])
701
+ tags.append(tag)
702
  vals.append(expanded_text(vec, lang))
703
+ df = pd.DataFrame({
704
+ UI[lang]["w"]: words,
705
+ UI[lang]["t"]: tags,
706
+ UI[lang]["m"]: vals,
707
+ })
708
  return _write_tsv(df, "Markað_útgreinað.tsv")
709
 
710
  with gr.Blocks(css=CSS, title="Marka") as demo: