Spaces:

DarylT01
/

dfa-ui

Sleeping

App Files Files Community

DarylT01 committed on May 1, 2024

Commit

15e4f2e

1 Parent(s): fc5e51e

feat(type): identify word type

Browse files

Files changed (6) hide show

adjectives.txt +3 -0
adverbs.txt +3 -0
app.py +76 -33
conjunctions.txt +3 -0
main.py +1 -1
words.txt +0 -42

adjectives.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+and
+but
+or

adverbs.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+nor
+for
+yet

app.py CHANGED Viewed

@@ -6,19 +6,29 @@ from essential_generators import DocumentGenerator
 from main import generate_dfa
 # DataFrame
-words = []
-with open("words.txt") as file:
-    words = file.read().splitlines()
-    words = [word.strip() for word in words]
-    df = pd.DataFrame(
-        {
-            "Words": words,
-        }
-    )
 # DFA function call
-dfa = generate_dfa(words)
 # Generate examples
@@ -36,9 +46,11 @@ def color_match(text: gr.Textbox):
     pointer = 0
     # Get the result of the DFA check on the input text
-    match_dict = dfa.check(text)
-    if not match_dict:
         return (
             '<div style="background-color: #dc2626; color: #fff; text-align: center; width: 100%; padding: 10px; font-weight:800; font-size:1.5rem">Rejected</div>',
             None,
@@ -47,9 +59,21 @@ def color_match(text: gr.Textbox):
     # Flatten the match_dict into a list of tuples and sort by the start index
     matches = sorted(
-        (start, end, word)
-        for word, indices in match_dict.items()
-        for start, end in indices
     )
     for start, end, word in matches:
@@ -64,23 +88,40 @@ def color_match(text: gr.Textbox):
     # Combine the strings
     colored_text = "".join(colored_text)
-    # Call getPositions function and get the DataFrame
-    positions_df = getPositions(text)
-    return colored_text, positions_df
-# Get positions function
-def getPositions(text):
-    match_dict = dfa.check(text)
-    positions_df = pd.DataFrame(columns=["Words", "Positions", "Occurences"])
-    for word, positions in match_dict.items():
         # Convert the list of tuples to a string
         positions_str = ", ".join(map(str, positions))
         # Store the word and the positions string in the wordPositions dictionary
-        positions_df.loc[len(positions_df)] = [word, positions_str, len(positions)]
-    return positions_df
 # Search and display function
@@ -132,13 +173,15 @@ with gr.Blocks() as demo:
             label="Search",
             placeholder="Search accepted words here",
             lines=1,
-            info="List of accpetable words in DFA",
             show_copy_button=True,
         )
         with gr.Row():
             cancel_btn = gr.ClearButton(search, variant="stop", interactive=False)
             search_btn = gr.Button(value="Search", variant="primary")
-        resultSearch = gr.Dataframe(df, height=300, col_count=1, headers=["Words"])
         search.change(
             text_change_search,
@@ -187,8 +230,8 @@ with gr.Blocks() as demo:
     # positionTitle = gr.HTML("<h2 style='color: gold;'>Position</h2>")
     position = gr.Dataframe(
         show_label=True,
-        col_count=3,
-        headers=["Words", "Positions", "Occurences"],
         interactive=False,
     )

 from main import generate_dfa
 # DataFrame
+conjunctions = []
+with open("conjunctions.txt") as file:
+    conjunctions = file.read().splitlines()
+    conjunctions = [word.strip() for word in conjunctions]
+with open("adverbs.txt") as file:
+    adverbs = file.read().splitlines()
+    adverbs = [word.strip() for word in adverbs]
+with open("adjectives.txt") as file:
+    adjectives = file.read().splitlines()
+    adjectives = [word.strip() for word in adjectives]
+df = pd.DataFrame(columns=["Words", "Type"])
+for i in conjunctions:
+    df.loc[len(df)] = [i, "Conjunction"]
+for i in adverbs:
+    df.loc[len(df)] = [i, "Adverb"]
+for i in adjectives:
+    df.loc[len(df)] = [i, "Adjective"]
 # DFA function call
+dfa_conjunctions = generate_dfa(conjunctions)
+dfa_adverbs = generate_dfa(adverbs)
+dfa_adjectives = generate_dfa(adjectives)
 # Generate examples
     pointer = 0
     # Get the result of the DFA check on the input text
+    match_dict_conj = dfa_conjunctions.check(text)
+    match_dict_adv = dfa_adverbs.check(text)
+    match_dict_adj = dfa_adjectives.check(text)
+    if not match_dict_conj and not match_dict_adv and not match_dict_adj:
         return (
             '<div style="background-color: #dc2626; color: #fff; text-align: center; width: 100%; padding: 10px; font-weight:800; font-size:1.5rem">Rejected</div>',
             None,
     # Flatten the match_dict into a list of tuples and sort by the start index
     matches = sorted(
+        [
+            (start, end, word)
+            for word, indices in match_dict_conj.items()
+            for start, end in indices
+        ]
+        + [
+            (start, end, word)
+            for word, indices in match_dict_adv.items()
+            for start, end in indices
+        ]
+        + [
+            (start, end, word)
+            for word, indices in match_dict_adj.items()
+            for start, end in indices
+        ]
     )
     for start, end, word in matches:
     # Combine the strings
     colored_text = "".join(colored_text)
+    # Create the DataFrame
+    positions_df = pd.DataFrame(columns=["Words", "Type", "Positions", "Occurences"])
+    for word, positions in match_dict_conj.items():
         # Convert the list of tuples to a string
         positions_str = ", ".join(map(str, positions))
         # Store the word and the positions string in the wordPositions dictionary
+        positions_df.loc[len(positions_df)] = [
+            word,
+            "Conjunction",
+            positions_str,
+            len(positions),
+        ]
+    for word, positions in match_dict_adv.items():
+        # Convert the list of tuples to a string
+        positions_str = ", ".join(map(str, positions))
+        # Store the word and the positions string in the wordPositions dictionary
+        positions_df.loc[len(positions_df)] = [
+            word,
+            "Adverb",
+            positions_str,
+            len(positions),
+        ]
+    for word, positions in match_dict_adj.items():
+        # Convert the list of tuples to a string
+        positions_str = ", ".join(map(str, positions))
+        # Store the word and the positions string in the wordPositions dictionary
+        positions_df.loc[len(positions_df)] = [
+            word,
+            "Adjective",
+            positions_str,
+            len(positions),
+        ]
+    return colored_text, positions_df
 # Search and display function
             label="Search",
             placeholder="Search accepted words here",
             lines=1,
+            info="List of acceptable words in DFA",
             show_copy_button=True,
         )
         with gr.Row():
             cancel_btn = gr.ClearButton(search, variant="stop", interactive=False)
             search_btn = gr.Button(value="Search", variant="primary")
+        resultSearch = gr.Dataframe(
+            df, height=300, col_count=2, headers=["Words", "Type"]
+        )
         search.change(
             text_change_search,
     # positionTitle = gr.HTML("<h2 style='color: gold;'>Position</h2>")
     position = gr.Dataframe(
         show_label=True,
+        col_count=4,
+        headers=["Words", "Type", "Positions", "Occurences"],
         interactive=False,
     )

conjunctions.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+subsequently
+meanwhile
+afterwards

main.py CHANGED Viewed

@@ -37,7 +37,7 @@ class DFA:
         chars = list(paragraph)
         current_word = ""
-        accepted_words: dict[list[tuple[int, int]]] = (
             {}
         )  # returns: {word: [(start_index, end_index)]}

         chars = list(paragraph)
         current_word = ""
+        accepted_words: dict[str : list[tuple[int, int]]] = (
             {}
         )  # returns: {word: [(start_index, end_index)]}

words.txt DELETED Viewed

@@ -1,42 +0,0 @@
-and
-but
-or
-nor
-for
-yet
-so
-although
-though
-because
-since
-until
-after
-before
-as
-if
-once
-provided
-that
-unless
-whereas
-while
-lest
-whether
-however
-moreover
-nevertheless
-nonetheless
-consequently
-therefore
-thus
-hence
-besides
-furthermore
-otherwise
-instead
-similarly
-likewise
-accordingly
-subsequently
-meanwhile
-afterwards