Spaces:

GeetaAIVisionary
/

nvidia-nemo-guardrails-demo

Sleeping

App Files Files Community

GeetaAIVisionary commited on Aug 17

Commit

eda4493

verified ·

1 Parent(s): ea612ad

Update app.py

Browse files

Files changed (1) hide show

app.py +95 -191

app.py CHANGED Viewed

@@ -1,204 +1,108 @@
-# app.py
-# CLI-like Spelling Bee Tutor as a simple Gradio UI (no LLMs, all offline)
-import gradio as gr
-import pandas as pd
 from pathlib import Path
-WORDS_PATH = Path("words.csv")
-def _load_words():
-    """Load CSV; ensure we have a 'word' column; create optional columns if missing.
-    Also compute a difficulty score (fallback = word length)."""
-    if not WORDS_PATH.exists():
-        # return empty df with expected columns
-        return pd.DataFrame(columns=["word", "definition", "origin", "sentence", "difficulty_score"])
-    df = pd.read_csv(WORDS_PATH)
-    # normalize required/optional columns
-    if "word" not in df.columns:
-        # treat first column as 'word'
-        df = df.rename(columns={df.columns[0]: "word"})
-    for col in ["definition", "origin", "sentence"]:
-        if col not in df.columns:
-            df[col] = ""
-    # difficulty: use numeric 'difficulty' if present; else use length
     if "difficulty" in df.columns:
         ds = pd.to_numeric(df["difficulty"], errors="coerce").fillna(0)
         df["difficulty_score"] = ds
     else:
         df["difficulty_score"] = df["word"].astype(str).str.len()
-    # sort hardest -> easiest
     df = df.sort_values("difficulty_score", ascending=False).reset_index(drop=True)
     return df
-DF = _load_words()
-def _summary(state):
-    if not state:
-        return "No round active."
-    n = state["n"]
-    score = state["score"]
-    return f"Round complete. Score this round: {score}/{n}."
-def start_quiz(n_words, state):
-    df = DF
-    if df.empty:
-        # disable input if no words
-        return (state,
-                "words.csv not found or empty.",
-                gr.update(value="", interactive=False),
-                "Please add a words.csv with at least one 'word' column.",
-                "Score: 0/0",
-                gr.update(value="", interactive=False))
-    try:
-        n = int(n_words or 5)
-    except Exception:
-        n = 5
-    # clip to available size
-    n = max(1, min(n, len(df)))
-    # take top-n hardest words
-    block = df.head(n).reset_index(drop=True)
-    s = {
-        "i": 0,
-        "n": n,
-        "score": 0,
-        "words": block["word"].astype(str).tolist(),
-        "defs": block["definition"].astype(str).tolist(),
-        "orig": block["origin"].astype(str).tolist(),
-        "sent": block["sentence"].astype(str).tolist(),
-    }
-    current = s["words"][0]
-    hist = f"Okay! We'll do {n} words this round, hardest → easiest.\nSpell this word: {current}"
-    status = "Type your spelling attempt, or click definition/origin/sentence."
-    return s, hist, gr.update(value=current, interactive=False), status, f"Score: 0/{n}", gr.update(value="", interactive=True)
-def _check_state(state):
-    if not state or "words" not in state or state["i"] >= state["n"]:
-        return False
-    return True
-def check_attempt(state, attempt, history, current_word, score_md):
-    if not _check_state(state):
-        return state, history, current_word, "No round active. Click Start.", score_md, gr.update(value="")
-    attempt = (attempt or "").strip()
-    if not attempt:
-        return state, history, current_word, "Type your attempt first.", score_md, gr.update(value="")
-    target = state["words"][state["i"]]
-    if attempt.lower() == target.lower():
-        state["score"] += 1
-        msg = "✅ Correct!"
-    else:
-        msg = "❌ Not quite. Try again or ask for definition/origin/sentence."
-    # append to history
-    history = f"{history}\nYou: {attempt}\nTutor: {msg}"
-    score_md = f"Score: {state['score']}/{state['n']}"
-    return state, history, current_word, msg, score_md, gr.update(value="")
-def _safe_text(val, fallback="Not available."):
-    v = (val or "").strip()
-    return v if v else fallback
-def show_def(state, history, current_word, score_md):
-    if not _check_state(state):
-        return state, history, current_word, "No round active. Click Start.", score_md
-    i = state["i"]
-    word = state["words"][i]
-    text = _safe_text(state["defs"][i])
-    history = f"{history}\nTutor (definition of {word}): {text}"
-    return state, history, current_word, f"Definition of {word}: {text}", score_md
-def show_origin(state, history, current_word, score_md):
-    if not _check_state(state):
-        return state, history, current_word, "No round active. Click Start.", score_md
-    i = state["i"]
-    word = state["words"][i]
-    text = _safe_text(state["orig"][i])
-    history = f"{history}\nTutor (origin of {word}): {text}"
-    return state, history, current_word, f"Origin of {word}: {text}", score_md
-def show_sentence(state, history, current_word, score_md):
-    if not _check_state(state):
-        return state, history, current_word, "No round active. Click Start.", score_md
-    i = state["i"]
-    word = state["words"][i]
-    text = _safe_text(state["sent"][i])
-    history = f"{history}\nTutor (sentence with {word}): {text}"
-    return state, history, current_word, f"Sentence: {text}", score_md
-def next_word(state, history, current_word, score_md):
-    if not _check_state(state):
-        return state, history, current_word, "No round active. Click Start.", score_md
-    state["i"] += 1
-    if state["i"] >= state["n"]:
-        # finished
-        summary = _summary(state)
-        history = f"{history}\n{summary}"
-        return {}, history, gr.update(value="", interactive=False), summary, f"Score: {state['score']}/{state['n']}"
-    # go to next word
-    w = state["words"][state["i"]]
-    history = f"{history}\nNext word: {w}"
-    status = "Type your spelling attempt, or click definition/origin/sentence."
-    return state, history, gr.update(value=w, interactive=False), status, f"Score: {state['score']}/{state['n']}"
-def stop_round(state, history, current_word, score_md):
-    if not state:
-        return {}, history, current_word, "Stopped.", score_md
-    summary = _summary(state)
-    history = f"{history}\n{summary}"
-    return {}, history, gr.update(value="", interactive=False), "Stopped.", f"Score: {state['score']}/{state['n']}"
-with gr.Blocks() as demo:
-    gr.Markdown("# NeMo Guardrails Demo (starter UI)\n**CLI-style spelling quiz** — works offline from `words.csv`.")
-    with gr.Row():
-        n_words = gr.Number(value=5, precision=0, label="Words this round")
-        start = gr.Button("Start quiz")
-    current_word = gr.Textbox(label="Spell this word", interactive=False)
-    attempt = gr.Textbox(label="Your attempt")
-    with gr.Row():
-        check = gr.Button("Check")
-        bdef = gr.Button("definition")
-        borg = gr.Button("origin")
-        bsent = gr.Button("sentence")
-        bnext = gr.Button("next")
-        bstop = gr.Button("stop")
-    status = gr.Markdown("")
-    score_md = gr.Markdown("Score: 0/0")
-    history = gr.Textbox(label="History", lines=14)
-    state = gr.State({})
-    # wire events
-    start.click(start_quiz, [n_words, state],
-                [state, history, current_word, status, score_md, attempt])
-    check.click(check_attempt, [state, attempt, history, current_word, score_md],
-                [state, history, current_word, status, score_md, attempt])
-    bdef.click(show_def, [state, history, current_word, score_md],
-               [state, history, current_word, status, score_md], queue=False)
-    borg.click(show_origin, [state, history, current_word, score_md],
-               [state, history, current_word, status, score_md], queue=False)
-    bsent.click(show_sentence, [state, history, current_word, score_md],
-                [state, history, current_word, status, score_md], queue=False)
-    bnext.click(next_word, [state, history, current_word, score_md],
-                [state, history, current_word, status, score_md], queue=False)
-    bstop.click(stop_round, [state, history, current_word, score_md],
-                [state, history, current_word, status, score_md], queue=False)
-if __name__ == "__main__":
-    demo.launch()

 from pathlib import Path
+import pandas as pd
+import csv
+# make path robust in Spaces
+WORDS_PATH = Path(__file__).parent / "words.csv"
+EXPECTED_COLS = ["word", "difficulty", "definition", "origin", "sentence"]
+def _load_words(path: Path = WORDS_PATH) -> pd.DataFrame:
+    """Load a possibly-messy CSV:
+       - tolerate commas inside sentence/origin
+       - accept exact 5 columns or more (extras glued into sentence)
+       - create missing optional columns
+    """
+    if not path.exists():
+        return pd.DataFrame(columns=["word", "definition", "origin", "sentence", "difficulty_score"])
+    rows = []
+    with open(path, "r", encoding="utf-8", newline="") as f:
+        # try a forgiving CSV read first (honors quotes like "…")
+        try:
+            df_try = pd.read_csv(
+                f,
+                engine="python",
+                quotechar='"',
+                escapechar='\\',
+                dtype=str,
+                keep_default_na=False
+            )
+            # If it parsed to 5+ columns, normalize below
+            df = df_try
+        except Exception:
+            # fall back to manual glue if pandas fails
+            f.seek(0)
+            reader = csv.reader(f)
+            header = next(reader, None)
+            header_ok = header and [h.strip().lower() for h in header[:5]] == EXPECTED_COLS
+            if not header_ok:
+                # treat first line as data
+                f.seek(0)
+                reader = csv.reader(f)
+            for row in reader:
+                if not row or all((x is None or str(x).strip() == "") for x in row):
+                    continue
+                # expect at least 5 fields; if more, glue extras into sentence
+                if len(row) < 5:
+                    # pad empty fields to avoid crash
+                    row = row + [""] * (5 - len(row))
+                base = row[:4]
+                sentence = ",".join(row[4:])  # glue any extras back
+                rows.append([*(str(x).strip() for x in base), sentence.strip()])
+            df = pd.DataFrame(rows, columns=EXPECTED_COLS)
+    # --- Normalize columns ---
+    cols = [c.strip().lower() for c in df.columns]
+    mapper = {c: c.strip().lower() for c in df.columns}
+    df = df.rename(columns=mapper)
+    # If there are more than 5 columns, rebuild to our schema
+    if df.shape[1] >= 5:
+        # take first four known fields if present, then glue rest into sentence
+        def pick(colname, default=""):
+            return df[colname] if colname in df.columns else default
+        base_df = pd.DataFrame({
+            "word": pick("word", ""),
+            "difficulty": pick("difficulty", ""),
+            "definition": pick("definition", ""),
+            "origin": pick("origin", ""),
+        })
+        # sentence = existing sentence + any extra cols joined by commas
+        extras = []
+        if "sentence" in df.columns:
+            extras.append(df["sentence"].astype(str))
+        extra_cols = [c for c in df.columns if c not in {"word","difficulty","definition","origin","sentence"}]
+        for c in extra_cols:
+            extras.append(df[c].astype(str))
+        if extras:
+            sentence_series = extras[0]
+            for s in extras[1:]:
+                sentence_series = sentence_series.str.cat(s, sep=",", na_rep="")
+        else:
+            sentence_series = pd.Series([""] * len(base_df))
+        base_df["sentence"] = sentence_series
+        df = base_df
+    else:
+        # ensure missing optional cols exist
+        for c in ["definition", "origin", "sentence", "difficulty"]:
+            if c not in df.columns:
+                df[c] = ""
+    # Clean and type
+    df["word"] = df["word"].astype(str).fillna("").str.strip()
+    df["definition"] = df["definition"].astype(str).fillna("").str.strip()
+    df["origin"] = df["origin"].astype(str).fillna("").str.strip()
+    df["sentence"] = df["sentence"].astype(str).fillna("").str.strip()
+    # difficulty score
     if "difficulty" in df.columns:
         ds = pd.to_numeric(df["difficulty"], errors="coerce").fillna(0)
         df["difficulty_score"] = ds
     else:
         df["difficulty_score"] = df["word"].astype(str).str.len()
+    # sort hardest → easiest
     df = df.sort_values("difficulty_score", ascending=False).reset_index(drop=True)
     return df