skalyan91 committed on
Commit
5b44626
·
verified ·
1 Parent(s): a6daf52

deploy at 2026-01-04 16:38:37.435466

Browse files
Files changed (4) hide show
  1. Dependency length.ipynb +72 -55
  2. main.py +308 -62
  3. sample_parse.svg +406 -0
  4. sample_parse_2.svg +406 -0
Dependency length.ipynb CHANGED
@@ -68,7 +68,8 @@
68
  " if token.dep_ == \"prep\" and token.head.pos_ in [\"VERB\", \"AUX\"] and \\\n",
69
  " ((len(list(token.head.rights)) >= 1 and token == list(token.head.rights)[0]) or \n",
70
  " (len(list(token.head.rights)) >= 2 and \n",
71
- " list(token.head.rights)[0].dep_ == \"dobj\" and token == list(token.head.rights)[1])):\n",
 
72
  " token.dep_ = \"comp\"\n",
73
  " if token.dep_ == \"ccomp\" and any(sibling.dep_ in relations[\"comp\"] \n",
74
  " for sibling in token.head.rights if sibling.i < token.i):\n",
@@ -122,12 +123,13 @@
122
  "outputs": [],
123
  "source": [
124
  "def flyover(token):\n",
125
- " if token.dep_ in [\"subj\", \"comp\", \"conj\"]:\n",
126
- " dep_distance = abs(token.i - token.head.i)\n",
 
127
  " if token.head.i < token.i:\n",
128
- " return (token.doc[token.head.i+1:token.i], dep_distance - 1)\n",
129
  " elif token.head.i > token.i:\n",
130
- " return (token.doc[token.i+1:token.head.i], dep_distance - 1)\n",
131
  " else:\n",
132
  " return (token.doc[token.i:token.i], 0)"
133
  ]
@@ -144,7 +146,7 @@
144
  " flyovers = [f for f in flyovers if len(f[0]) > 0]\n",
145
  " flyovers = [f1 for f1 in flyovers if len([f2 for f2 in flyovers if \n",
146
  " (f2[0][-1].i > f1[0][0].i >= f2[0][0].i or f2[0][0].i < f1[0][-1].i <= f2[0][-1].i) and \n",
147
- " (len(f1[0]) < len(f2[0]) or f1[1] < f2[1])]) == 0 and len(f1[0]) > 2]\n",
148
  " flyovers = sorted(flyovers, key=lambda x: x[0][0].i)\n",
149
  " interstices = []\n",
150
  " for i in range(len(flyovers)):\n",
@@ -168,108 +170,121 @@
168
  },
169
  {
170
  "cell_type": "code",
171
- "execution_count": 6,
172
  "id": "ba90ff19-c665-49d8-8ad4-5caee885901d",
173
  "metadata": {},
174
  "outputs": [
175
  {
176
  "data": {
177
  "text/html": [
178
- "<span class=\"tex2jax_ignore\"><svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" xml:lang=\"en\" id=\"7cae4e9aeafb4cf4bd557e4780eb30b6-0\" class=\"displacy\" width=\"1450\" height=\"399.5\" direction=\"ltr\" style=\"max-width: none; height: 399.5px; color: #000000; background: #ffffff; font-family: Arial; direction: ltr\">\n",
179
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
180
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"50\">They</tspan>\n",
181
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"50\">PRON</tspan>\n",
182
  "</text>\n",
183
  "\n",
184
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
185
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"225\">designated</tspan>\n",
186
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"225\">VERB</tspan>\n",
187
  "</text>\n",
188
  "\n",
189
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
190
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"400\">the</tspan>\n",
191
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"400\">DET</tspan>\n",
192
  "</text>\n",
193
  "\n",
194
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
195
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"575\">building,</tspan>\n",
196
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"575\">NOUN</tspan>\n",
197
  "</text>\n",
198
  "\n",
199
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
200
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"750\">as</tspan>\n",
201
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"750\">ADP</tspan>\n",
202
  "</text>\n",
203
  "\n",
204
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
205
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"925\">a</tspan>\n",
206
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"925\">DET</tspan>\n",
207
  "</text>\n",
208
  "\n",
209
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
210
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"1100\">national</tspan>\n",
211
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"1100\">ADJ</tspan>\n",
212
  "</text>\n",
213
  "\n",
214
- "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"309.5\">\n",
215
- " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"1275\">landmark.</tspan>\n",
216
- " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"1275\">NOUN</tspan>\n",
217
  "</text>\n",
218
  "\n",
 
 
 
 
 
 
 
 
 
 
 
 
 
219
  "<g class=\"displacy-arrow\">\n",
220
- " <path class=\"displacy-arc\" id=\"arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-0\" stroke-width=\"2px\" d=\"M70,264.5 C70,177.0 215.0,177.0 215.0,264.5\" fill=\"none\" stroke=\"currentColor\"/>\n",
221
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
222
- " <textPath xlink:href=\"#arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-0\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">subj</textPath>\n",
223
  " </text>\n",
224
- " <path class=\"displacy-arrowhead\" d=\"M70,266.5 L62,254.5 78,254.5\" fill=\"currentColor\"/>\n",
225
  "</g>\n",
226
  "\n",
227
  "<g class=\"displacy-arrow\">\n",
228
- " <path class=\"displacy-arc\" id=\"arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-1\" stroke-width=\"2px\" d=\"M420,264.5 C420,177.0 565.0,177.0 565.0,264.5\" fill=\"none\" stroke=\"currentColor\"/>\n",
229
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
230
- " <textPath xlink:href=\"#arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-1\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">det</textPath>\n",
231
  " </text>\n",
232
- " <path class=\"displacy-arrowhead\" d=\"M420,266.5 L412,254.5 428,254.5\" fill=\"currentColor\"/>\n",
233
  "</g>\n",
234
  "\n",
235
  "<g class=\"displacy-arrow\">\n",
236
- " <path class=\"displacy-arc\" id=\"arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-2\" stroke-width=\"2px\" d=\"M245,264.5 C245,89.5 570.0,89.5 570.0,264.5\" fill=\"none\" stroke=\"currentColor\"/>\n",
237
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
238
- " <textPath xlink:href=\"#arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-2\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">comp</textPath>\n",
239
  " </text>\n",
240
- " <path class=\"displacy-arrowhead\" d=\"M570.0,266.5 L578.0,254.5 562.0,254.5\" fill=\"currentColor\"/>\n",
241
  "</g>\n",
242
  "\n",
243
  "<g class=\"displacy-arrow\">\n",
244
- " <path class=\"displacy-arc\" id=\"arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-3\" stroke-width=\"2px\" d=\"M245,264.5 C245,2.0 750.0,2.0 750.0,264.5\" fill=\"none\" stroke=\"currentColor\"/>\n",
245
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
246
- " <textPath xlink:href=\"#arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-3\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">udep</textPath>\n",
247
  " </text>\n",
248
- " <path class=\"displacy-arrowhead\" d=\"M750.0,266.5 L758.0,254.5 742.0,254.5\" fill=\"currentColor\"/>\n",
249
  "</g>\n",
250
  "\n",
251
  "<g class=\"displacy-arrow\">\n",
252
- " <path class=\"displacy-arc\" id=\"arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-4\" stroke-width=\"2px\" d=\"M945,264.5 C945,89.5 1270.0,89.5 1270.0,264.5\" fill=\"none\" stroke=\"currentColor\"/>\n",
253
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
254
- " <textPath xlink:href=\"#arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-4\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">det</textPath>\n",
255
  " </text>\n",
256
- " <path class=\"displacy-arrowhead\" d=\"M945,266.5 L937,254.5 953,254.5\" fill=\"currentColor\"/>\n",
257
  "</g>\n",
258
  "\n",
259
  "<g class=\"displacy-arrow\">\n",
260
- " <path class=\"displacy-arc\" id=\"arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-5\" stroke-width=\"2px\" d=\"M1120,264.5 C1120,177.0 1265.0,177.0 1265.0,264.5\" fill=\"none\" stroke=\"currentColor\"/>\n",
261
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
262
- " <textPath xlink:href=\"#arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-5\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">udep</textPath>\n",
263
  " </text>\n",
264
- " <path class=\"displacy-arrowhead\" d=\"M1120,266.5 L1112,254.5 1128,254.5\" fill=\"currentColor\"/>\n",
265
  "</g>\n",
266
  "\n",
267
  "<g class=\"displacy-arrow\">\n",
268
- " <path class=\"displacy-arc\" id=\"arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-6\" stroke-width=\"2px\" d=\"M770,264.5 C770,2.0 1275.0,2.0 1275.0,264.5\" fill=\"none\" stroke=\"currentColor\"/>\n",
269
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
270
- " <textPath xlink:href=\"#arrow-7cae4e9aeafb4cf4bd557e4780eb30b6-0-6\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">comp</textPath>\n",
271
  " </text>\n",
272
- " <path class=\"displacy-arrowhead\" d=\"M1275.0,266.5 L1283.0,254.5 1267.0,254.5\" fill=\"currentColor\"/>\n",
273
  "</g>\n",
274
  "</svg></span>"
275
  ],
@@ -282,9 +297,11 @@
282
  }
283
  ],
284
  "source": [
285
- "doc = ssudify(nlp(\"They designated the building, as a national landmark.\"))\n",
286
  "# Since this is an interactive Jupyter environment, we can use displacy.render here\n",
287
- "displacy.render(doc, style='dep')"
 
 
288
  ]
289
  },
290
  {
 
68
  " if token.dep_ == \"prep\" and token.head.pos_ in [\"VERB\", \"AUX\"] and \\\n",
69
  " ((len(list(token.head.rights)) >= 1 and token == list(token.head.rights)[0]) or \n",
70
  " (len(list(token.head.rights)) >= 2 and \n",
71
+ " (list(token.head.rights)[0].dep_ == \"dobj\" or list(token.head.rights)[0].pos_ == \"ADV\") and \n",
72
+ " token == list(token.head.rights)[1])):\n",
73
  " token.dep_ = \"comp\"\n",
74
  " if token.dep_ == \"ccomp\" and any(sibling.dep_ in relations[\"comp\"] \n",
75
  " for sibling in token.head.rights if sibling.i < token.i):\n",
 
123
  "outputs": [],
124
  "source": [
125
  "def flyover(token):\n",
126
+ " if token.dep_ in [\"subj\", \"comp\"]:\n",
127
+ " dep_distance = len([t for t in token.doc[min(token.i, token.head.i) + 1 : max(token.i, token.head.i)]\n",
128
+ " if len(list(t.children)) > 0])\n",
129
  " if token.head.i < token.i:\n",
130
+ " return (token.doc[token.head.i+1:token.i], dep_distance)\n",
131
  " elif token.head.i > token.i:\n",
132
+ " return (token.doc[token.i+1:token.head.i], dep_distance)\n",
133
  " else:\n",
134
  " return (token.doc[token.i:token.i], 0)"
135
  ]
 
146
  " flyovers = [f for f in flyovers if len(f[0]) > 0]\n",
147
  " flyovers = [f1 for f1 in flyovers if len([f2 for f2 in flyovers if \n",
148
  " (f2[0][-1].i > f1[0][0].i >= f2[0][0].i or f2[0][0].i < f1[0][-1].i <= f2[0][-1].i) and \n",
149
+ " (len(f1[0]) < len(f2[0]) or f1[1] < f2[1])]) == 0 and len(f1[0]) > 0]\n",
150
  " flyovers = sorted(flyovers, key=lambda x: x[0][0].i)\n",
151
  " interstices = []\n",
152
  " for i in range(len(flyovers)):\n",
 
170
  },
171
  {
172
  "cell_type": "code",
173
+ "execution_count": 13,
174
  "id": "ba90ff19-c665-49d8-8ad4-5caee885901d",
175
  "metadata": {},
176
  "outputs": [
177
  {
178
  "data": {
179
  "text/html": [
180
+ "<span class=\"tex2jax_ignore\"><svg xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\" xml:lang=\"en\" id=\"b935f75a06f14438a922ac30e5ab8f72-0\" class=\"displacy\" width=\"950\" height=\"337.0\" direction=\"ltr\" style=\"max-width: none; height: 337.0px; color: #000000; background: #ffffff; font-family: ; direction: ltr\">\n",
181
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
182
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"50\">The</tspan>\n",
183
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"50\">DET</tspan>\n",
184
  "</text>\n",
185
  "\n",
186
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
187
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"150\">manager,</tspan>\n",
188
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"150\">NOUN</tspan>\n",
189
  "</text>\n",
190
  "\n",
191
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
192
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"250\">although</tspan>\n",
193
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"250\">SCONJ</tspan>\n",
194
  "</text>\n",
195
  "\n",
196
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
197
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"350\">she</tspan>\n",
198
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"350\">PRON</tspan>\n",
199
  "</text>\n",
200
  "\n",
201
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
202
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"450\">had</tspan>\n",
203
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"450\">VERB</tspan>\n",
204
  "</text>\n",
205
  "\n",
206
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
207
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"550\">doubts,</tspan>\n",
208
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"550\">NOUN</tspan>\n",
209
  "</text>\n",
210
  "\n",
211
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
212
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"650\">approved</tspan>\n",
213
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"650\">VERB</tspan>\n",
214
  "</text>\n",
215
  "\n",
216
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
217
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"750\">the</tspan>\n",
218
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"750\">DET</tspan>\n",
219
  "</text>\n",
220
  "\n",
221
+ "<text class=\"displacy-token\" fill=\"currentColor\" text-anchor=\"middle\" y=\"247.0\">\n",
222
+ " <tspan class=\"displacy-word\" fill=\"currentColor\" x=\"850\">proposal.</tspan>\n",
223
+ " <tspan class=\"displacy-tag\" dy=\"2em\" fill=\"currentColor\" x=\"850\">NOUN</tspan>\n",
224
+ "</text>\n",
225
+ "\n",
226
+ "<g class=\"displacy-arrow\">\n",
227
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-0\" stroke-width=\"2px\" d=\"M62,202.0 62,185.33333333333334 141.0,185.33333333333334 141.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
228
+ " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
229
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-0\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">det</textPath>\n",
230
+ " </text>\n",
231
+ " <path class=\"displacy-arrowhead\" d=\"M62,204.0 L58,196.0 66,196.0\" fill=\"currentColor\"/>\n",
232
+ "</g>\n",
233
+ "\n",
234
  "<g class=\"displacy-arrow\">\n",
235
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-1\" stroke-width=\"2px\" d=\"M162,202.0 162,135.33333333333331 650.0,135.33333333333331 650.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
236
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
237
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-1\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">subj</textPath>\n",
238
  " </text>\n",
239
+ " <path class=\"displacy-arrowhead\" d=\"M162,204.0 L158,196.0 166,196.0\" fill=\"currentColor\"/>\n",
240
  "</g>\n",
241
  "\n",
242
  "<g class=\"displacy-arrow\">\n",
243
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-2\" stroke-width=\"2px\" d=\"M262,202.0 262,152.0 647.0,152.0 647.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
244
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
245
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-2\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">mod</textPath>\n",
246
  " </text>\n",
247
+ " <path class=\"displacy-arrowhead\" d=\"M262,204.0 L258,196.0 266,196.0\" fill=\"currentColor\"/>\n",
248
  "</g>\n",
249
  "\n",
250
  "<g class=\"displacy-arrow\">\n",
251
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-3\" stroke-width=\"2px\" d=\"M362,202.0 362,185.33333333333334 441.0,185.33333333333334 441.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
252
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
253
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-3\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">subj</textPath>\n",
254
  " </text>\n",
255
+ " <path class=\"displacy-arrowhead\" d=\"M362,204.0 L358,196.0 366,196.0\" fill=\"currentColor\"/>\n",
256
  "</g>\n",
257
  "\n",
258
  "<g class=\"displacy-arrow\">\n",
259
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-4\" stroke-width=\"2px\" d=\"M262,202.0 262,168.66666666666666 444.0,168.66666666666666 444.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
260
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
261
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-4\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">comp</textPath>\n",
262
  " </text>\n",
263
+ " <path class=\"displacy-arrowhead\" d=\"M444.0,204.0 L448.0,196.0 440.0,196.0\" fill=\"currentColor\"/>\n",
264
  "</g>\n",
265
  "\n",
266
  "<g class=\"displacy-arrow\">\n",
267
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-5\" stroke-width=\"2px\" d=\"M462,202.0 462,185.33333333333334 541.0,185.33333333333334 541.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
268
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
269
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-5\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">comp</textPath>\n",
270
  " </text>\n",
271
+ " <path class=\"displacy-arrowhead\" d=\"M541.0,204.0 L545.0,196.0 537.0,196.0\" fill=\"currentColor\"/>\n",
272
  "</g>\n",
273
  "\n",
274
  "<g class=\"displacy-arrow\">\n",
275
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-6\" stroke-width=\"2px\" d=\"M762,202.0 762,185.33333333333334 841.0,185.33333333333334 841.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
276
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
277
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-6\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">det</textPath>\n",
278
  " </text>\n",
279
+ " <path class=\"displacy-arrowhead\" d=\"M762,204.0 L758,196.0 766,196.0\" fill=\"currentColor\"/>\n",
280
  "</g>\n",
281
  "\n",
282
  "<g class=\"displacy-arrow\">\n",
283
+ " <path class=\"displacy-arc\" id=\"arrow-b935f75a06f14438a922ac30e5ab8f72-0-7\" stroke-width=\"2px\" d=\"M662,202.0 662,168.66666666666666 844.0,168.66666666666666 844.0,202.0\" fill=\"none\" stroke=\"currentColor\"/>\n",
284
  " <text dy=\"1.25em\" style=\"font-size: 0.8em; letter-spacing: 1px\">\n",
285
+ " <textPath xlink:href=\"#arrow-b935f75a06f14438a922ac30e5ab8f72-0-7\" class=\"displacy-label\" startOffset=\"50%\" side=\"left\" fill=\"currentColor\" text-anchor=\"middle\">comp</textPath>\n",
286
  " </text>\n",
287
+ " <path class=\"displacy-arrowhead\" d=\"M844.0,204.0 L848.0,196.0 840.0,196.0\" fill=\"currentColor\"/>\n",
288
  "</g>\n",
289
  "</svg></span>"
290
  ],
 
297
  }
298
  ],
299
  "source": [
300
+ "doc = ssudify(nlp(\"The manager, although she had doubts, approved the proposal.\"))\n",
301
  "# Since this is an interactive Jupyter environment, we can use displacy.render here\n",
302
+ "displacy.render(doc, style='dep', options={'compact': True, 'font': \"\", 'distance': 100})\n",
303
+ "# with open(\"sample_parse.svg\", \"w\", encoding=\"utf-8\") as f:\n",
304
+ "# f.write(svg)"
305
  ]
306
  },
307
  {
main.py CHANGED
@@ -7,52 +7,97 @@ nlp = spacy.load("en_core_web_sm")
7
 
8
  relations = {
9
  "subj": ["nsubj", "nsubjpass", "csubj", "csubjpass", "expl"],
10
- "comp": ["dobj", "dative", "attr", "oprd", "pobj", "aux", "auxpass", "mark", "case", "ccomp", "xcomp", "acomp"],
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  "mod": ["agent", "advmod", "advcl", "relcl", "npmod", "npadvmod", "prt"],
12
  "udep": ["acl", "amod", "nmod", "poss", "nummod", "prep"],
13
  }
14
 
15
 
16
- def ssudify(doc):
17
  for token in doc:
18
  to_reverse = [token]
19
  for child in token.children:
20
- if (child.dep_ in ["aux", "auxpass", "mark", "case"]) or (child.dep_ == "advmod" and child.pos_ == "SCONJ"):
 
 
21
  to_reverse.append(child)
22
- to_reverse.sort(key = lambda x: abs(x.i - token.i))
23
  if len(to_reverse) > 1:
24
  for i in range(1, len(to_reverse)):
25
  if to_reverse[i].dep_ in ["aux", "auxpass"]:
26
- for child in to_reverse[i-1].children:
27
- if child.dep_ in relations["subj"] + relations["mod"] + ["conj", "cc"]:
 
 
 
28
  child.head = to_reverse[i]
29
- to_reverse[i].head = to_reverse[i-1].head if to_reverse[i-1].head != to_reverse[i-1] else to_reverse[i]
30
- to_reverse[i].dep_ = to_reverse[i-1].dep_
31
- to_reverse[i-1].head = to_reverse[i]
32
- to_reverse[i-1].dep_ = "comp"
 
 
 
 
33
  for token in doc:
34
- if token.dep_ == "dep": token.dep_ = "unknown"
35
- if token.dep_ == "prep" and token.head.pos_ in ["VERB", "AUX"] and \
36
- token.i < token.head.i and token.head.dep_ not in relations["mod"]:
 
 
 
 
 
37
  token.dep_ = "mod"
38
- if token.dep_ == "prep" and token.head.pos_ in ["VERB", "AUX"] and \
39
- ((len(list(token.head.rights)) >= 1 and token == list(token.head.rights)[0]) or
40
- (len(list(token.head.rights)) >= 2 and
41
- list(token.head.rights)[0].dep_ == "dobj" and token == list(token.head.rights)[1])):
 
 
 
 
 
 
 
 
 
 
 
42
  token.dep_ = "comp"
43
- if token.dep_ == "ccomp" and any(sibling.dep_ in relations["comp"]
44
- for sibling in token.head.rights if sibling.i < token.i):
 
 
 
45
  token.dep_ = "mod"
46
  dobjs = [child for child in token.children if child.dep_ == "dobj"]
47
  if len(dobjs) > 1:
48
  for i in range(1, len(dobjs)):
49
- dobjs[i].head = dobjs[i-1]
50
  dobjs[i].dep_ = "appos"
51
  for token in doc:
52
  for rel in relations.keys():
53
- if token.dep_ in relations[rel]: token.dep_ = rel
 
54
  for token in doc:
55
- subjects = sorted([child for child in token.children if child.dep_ == "subj"], key = lambda x: abs(x.i - token.i))
 
 
 
56
  if len(subjects) > 1:
57
  for s in subjects[1:]:
58
  s.dep_ = "comp"
@@ -63,66 +108,117 @@ def ssudify(doc):
63
  if child.dep_ in ["comp", "udep"] and token.dep_ != "mod":
64
  child.dep_ = "mod"
65
  for token in doc:
66
- if any(t.text in [";", ":"] for t in doc
67
- if ((token.i < t.i < token.head.i and not
68
- (any(p.text == "(" for p in doc if token.i < p.i < t.i) and
69
- any(p.text == ")" for p in doc if t.i < p.i < token.head.i))) or
70
- (token.head.i < t.i < token.i and not
71
- (any(p.text == "(" for p in doc if token.head.i < p.i < t.i) and
72
- any(p.text == ")" for p in doc if t.i < p.i < token.i)))) and token.pos_ != "PUNCT"):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
73
  token.head = token
74
  token.dep_ = "root"
75
  if token.pos_ in ["VERB", "AUX"]:
76
- core_children = [child for child in token.children if child.dep_ in ["subj", "comp", "udep"]]
 
 
 
 
77
  core_children.append(token)
78
  core_children.sort(key=lambda x: x.i)
79
  right_edge = [t for t in core_children[-1].subtree if t.pos_ != "PUNCT"][-1]
80
  if right_edge.i < len(doc) - 1:
81
- if right_edge.text == "," or doc[right_edge.i+1].text == ",":
82
- for child in [child for child in token.children if child.i > right_edge.i and child.dep_ == "conj"]:
 
 
 
 
83
  child.dep_ = "mod"
84
- if token.pos_ in ["VERB", "AUX"] and token.head.pos_ == "NOUN" and token.dep_ == "udep":
 
 
 
 
85
  token.dep_ = "mod"
86
  return doc
87
 
88
 
89
  def flyover(token):
90
- if token.dep_ in ["subj", "comp", "udep", "conj"]:
91
- dep_distance = abs(token.i - token.head.i)
 
 
 
 
 
 
 
 
92
  if token.head.i < token.i:
93
- return (token.doc[token.head.i+1:token.i], dep_distance - 1)
94
  elif token.head.i > token.i:
95
- return (token.doc[token.i+1:token.head.i], dep_distance - 1)
96
  else:
97
- return (token.doc[token.i:token.i], 0)
98
 
99
 
100
  def get_fluff(doc):
101
  flyovers = list(map(flyover, doc))
102
  flyovers = [f for f in flyovers if len(f[0]) > 0]
103
- flyovers = [f1 for f1 in flyovers if len([f2 for f2 in flyovers if
104
- (f2[0][-1].i > f1[0][0].i >= f2[0][0].i or f2[0][0].i < f1[0][-1].i <= f2[0][-1].i) and
105
- (len(f1[0]) < len(f2[0]) or f1[1] < f2[1])]) == 0 and len(f1[0]) > 2]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
106
  flyovers = sorted(flyovers, key=lambda x: x[0][0].i)
107
  interstices = []
108
  for i in range(len(flyovers)):
109
  if i == 0:
110
  if flyovers[0][0][0].i > 0:
111
- interstices.append((doc[0:flyovers[0][0][0].i], 0))
112
  else:
113
- if flyovers[i][0][0].i > flyovers[i-1][0][-1].i + 1:
114
- interstices.append((doc[flyovers[i-1][0][-1].i+1:flyovers[i][0][0].i], 0))
 
 
115
  # elif flyovers[i][1] == flyovers[i-1][1]:
116
  # flyovers[i] = (doc[flyovers[i-1][0][0].i:flyovers[i][0][-1].i+1], flyovers[i][1])
117
  # flyovers[i-1] = (doc[flyovers[i-1][0][0].i:flyovers[i-1][0][0].i], flyovers[i-1][1])
118
  if len(flyovers) > 0:
119
  if flyovers[-1][0][-1].i < doc[-1].i:
120
- interstices.append((doc[flyovers[-1][0][-1].i+1:], 0))
121
  else:
122
  interstices.append((doc, 0))
123
  flyovers = [f for f in flyovers if len(f[0]) > 0]
124
  return sorted(flyovers + interstices, key=lambda x: x[0][0].i)
125
 
 
126
  from fasthtml_hf import setup_hf_backup
127
  from fasthtml.common import *
128
  import re
@@ -134,31 +230,181 @@ app, rt = fast_app(pico=True)
134
  def index():
135
  page = Div(
136
  Form(hx_post=send, hx_target="#output", hx_swap="outerHTML")(
137
- Div(Button("Check", style="margin-bottom: 1rem"),
138
- Textarea(name="text", style="height: calc(100vh - 11rem)"))
 
 
 
 
 
 
 
 
 
 
 
 
 
 
139
  ),
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
140
  Div(
141
- Div(Small(Em("Highlighted text segments can be shortened or reordered to improve readability. The stronger the highlight, the more the segment burdens the reader’s memory.")),
142
- cls="overflow-auto", style="height: 4rem; text-wrap: balance; padding: 0rem 1rem"),
143
- Div(id="output", style="padding: 1rem; padding-bottom: calc(1rem - 5px)")
 
144
  ),
145
- cls="grid"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
146
  )
147
- return Titled('Readability feedback', page)
 
148
 
149
  @app.post
150
- def send(text:str):
151
  paragraphs = re.sub(r"[^\S\r\n]+", " ", text).split("\r\n\r\n")
152
- docs = [ssudify(nlp(para)) for para in paragraphs]
153
  annot_paras = [get_fluff(doc) for doc in docs]
154
- return Div(*[P(*[Span(Span(a[0], style=f"background: light-dark(rgba(237, 201, 241, {a[1]/15}), rgba(182, 69, 205, {a[1]/15}))"),
155
- Span(" ")) for a in annot_para],
156
- style="margin-bottom: 1.5em")
157
- for annot_para in annot_paras[:-1]],
158
- P(*[Span(Span(a[0], style=f"background: light-dark(rgba(237, 201, 241, {a[1]/15}), rgba(182, 69, 205, {a[1]/15}))"),
159
- Span(" ")) for a in annot_paras[-1]],
160
- style="margin-bottom: 0em"),
161
- id="output", cls="overflow-auto", style="height: calc(100vh - 11rem); padding: 1rem; padding-bottom: calc(1rem - 5px)")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
162
 
163
  setup_hf_backup(app)
164
  serve()
 
7
 
8
  relations = {
9
  "subj": ["nsubj", "nsubjpass", "csubj", "csubjpass", "expl"],
10
+ "comp": [
11
+ "dobj",
12
+ "dative",
13
+ "attr",
14
+ "oprd",
15
+ "pobj",
16
+ "aux",
17
+ "auxpass",
18
+ "mark",
19
+ "case",
20
+ "ccomp",
21
+ "xcomp",
22
+ "acomp",
23
+ ],
24
  "mod": ["agent", "advmod", "advcl", "relcl", "npmod", "npadvmod", "prt"],
25
  "udep": ["acl", "amod", "nmod", "poss", "nummod", "prep"],
26
  }
27
 
28
 
29
+ def sudify(doc):
30
  for token in doc:
31
  to_reverse = [token]
32
  for child in token.children:
33
+ if (child.dep_ in ["aux", "auxpass", "mark", "case"]) or (
34
+ child.dep_ == "advmod" and child.pos_ == "SCONJ"
35
+ ):
36
  to_reverse.append(child)
37
+ to_reverse.sort(key=lambda x: abs(x.i - token.i))
38
  if len(to_reverse) > 1:
39
  for i in range(1, len(to_reverse)):
40
  if to_reverse[i].dep_ in ["aux", "auxpass"]:
41
+ for child in to_reverse[i - 1].children:
42
+ if child.dep_ in relations["subj"] + relations["mod"] + [
43
+ "conj",
44
+ "cc",
45
+ ]:
46
  child.head = to_reverse[i]
47
+ to_reverse[i].head = (
48
+ to_reverse[i - 1].head
49
+ if to_reverse[i - 1].head != to_reverse[i - 1]
50
+ else to_reverse[i]
51
+ )
52
+ to_reverse[i].dep_ = to_reverse[i - 1].dep_
53
+ to_reverse[i - 1].head = to_reverse[i]
54
+ to_reverse[i - 1].dep_ = "comp"
55
  for token in doc:
56
+ if token.dep_ == "dep":
57
+ token.dep_ = "unknown"
58
+ if (
59
+ token.dep_ == "prep"
60
+ and token.head.pos_ in ["VERB", "AUX"]
61
+ and token.i < token.head.i
62
+ and token.head.dep_ not in relations["mod"]
63
+ ):
64
  token.dep_ = "mod"
65
+ if (
66
+ token.dep_ == "prep"
67
+ and token.head.pos_ in ["VERB", "AUX"]
68
+ and (
69
+ (
70
+ len(list(token.head.rights)) >= 1
71
+ and token == list(token.head.rights)[0]
72
+ )
73
+ or (
74
+ len(list(token.head.rights)) >= 2
75
+ and list(token.head.rights)[0].dep_ == "dobj"
76
+ and token == list(token.head.rights)[1]
77
+ )
78
+ )
79
+ ):
80
  token.dep_ = "comp"
81
+ if token.dep_ == "ccomp" and any(
82
+ sibling.dep_ in relations["comp"]
83
+ for sibling in token.head.rights
84
+ if sibling.i < token.i
85
+ ):
86
  token.dep_ = "mod"
87
  dobjs = [child for child in token.children if child.dep_ == "dobj"]
88
  if len(dobjs) > 1:
89
  for i in range(1, len(dobjs)):
90
+ dobjs[i].head = dobjs[i - 1]
91
  dobjs[i].dep_ = "appos"
92
  for token in doc:
93
  for rel in relations.keys():
94
+ if token.dep_ in relations[rel]:
95
+ token.dep_ = rel
96
  for token in doc:
97
+ subjects = sorted(
98
+ [child for child in token.children if child.dep_ == "subj"],
99
+ key=lambda x: abs(x.i - token.i),
100
+ )
101
  if len(subjects) > 1:
102
  for s in subjects[1:]:
103
  s.dep_ = "comp"
 
108
  if child.dep_ in ["comp", "udep"] and token.dep_ != "mod":
109
  child.dep_ = "mod"
110
  for token in doc:
111
+ if any(
112
+ t.text in [";", ":"]
113
+ for t in doc
114
+ if (
115
+ (
116
+ token.i < t.i < token.head.i
117
+ and not (
118
+ any(p.text == "(" for p in doc if token.i < p.i < t.i)
119
+ and any(p.text == ")" for p in doc if t.i < p.i < token.head.i)
120
+ )
121
+ )
122
+ or (
123
+ token.head.i < t.i < token.i
124
+ and not (
125
+ any(p.text == "(" for p in doc if token.head.i < p.i < t.i)
126
+ and any(p.text == ")" for p in doc if t.i < p.i < token.i)
127
+ )
128
+ )
129
+ )
130
+ and token.pos_ != "PUNCT"
131
+ ):
132
  token.head = token
133
  token.dep_ = "root"
134
  if token.pos_ in ["VERB", "AUX"]:
135
+ core_children = [
136
+ child
137
+ for child in token.children
138
+ if child.dep_ in ["subj", "comp", "udep"]
139
+ ]
140
  core_children.append(token)
141
  core_children.sort(key=lambda x: x.i)
142
  right_edge = [t for t in core_children[-1].subtree if t.pos_ != "PUNCT"][-1]
143
  if right_edge.i < len(doc) - 1:
144
+ if right_edge.text == "," or doc[right_edge.i + 1].text == ",":
145
+ for child in [
146
+ child
147
+ for child in token.children
148
+ if child.i > right_edge.i and child.dep_ == "conj"
149
+ ]:
150
  child.dep_ = "mod"
151
+ if (
152
+ token.pos_ in ["VERB", "AUX"]
153
+ and token.head.pos_ == "NOUN"
154
+ and token.dep_ == "udep"
155
+ ):
156
  token.dep_ = "mod"
157
  return doc
158
 
159
 
160
  def flyover(token):
161
+ if token.dep_ in ["subj", "comp"]:
162
+ dep_distance = len(
163
+ [
164
+ t
165
+ for t in token.doc[
166
+ min(token.i, token.head.i) + 1 : max(token.i, token.head.i)
167
+ ]
168
+ if len(list(t.children)) > 0
169
+ ]
170
+ )
171
  if token.head.i < token.i:
172
+ return (token.doc[token.head.i + 1 : token.i], dep_distance)
173
  elif token.head.i > token.i:
174
+ return (token.doc[token.i + 1 : token.head.i], dep_distance)
175
  else:
176
+ return (token.doc[token.i : token.i], 0)
177
 
178
 
179
  def get_fluff(doc):
180
  flyovers = list(map(flyover, doc))
181
  flyovers = [f for f in flyovers if len(f[0]) > 0]
182
+ flyovers = [
183
+ f1
184
+ for f1 in flyovers
185
+ if len(
186
+ [
187
+ f2
188
+ for f2 in flyovers
189
+ if (
190
+ f2[0][-1].i > f1[0][0].i >= f2[0][0].i
191
+ or f2[0][0].i < f1[0][-1].i <= f2[0][-1].i
192
+ )
193
+ and (len(f1[0]) < len(f2[0]) or f1[1] < f2[1])
194
+ ]
195
+ )
196
+ == 0
197
+ and f1[1] > 0
198
+ ]
199
  flyovers = sorted(flyovers, key=lambda x: x[0][0].i)
200
  interstices = []
201
  for i in range(len(flyovers)):
202
  if i == 0:
203
  if flyovers[0][0][0].i > 0:
204
+ interstices.append((doc[0 : flyovers[0][0][0].i], 0))
205
  else:
206
+ if flyovers[i][0][0].i > flyovers[i - 1][0][-1].i + 1:
207
+ interstices.append(
208
+ (doc[flyovers[i - 1][0][-1].i + 1 : flyovers[i][0][0].i], 0)
209
+ )
210
  # elif flyovers[i][1] == flyovers[i-1][1]:
211
  # flyovers[i] = (doc[flyovers[i-1][0][0].i:flyovers[i][0][-1].i+1], flyovers[i][1])
212
  # flyovers[i-1] = (doc[flyovers[i-1][0][0].i:flyovers[i-1][0][0].i], flyovers[i-1][1])
213
  if len(flyovers) > 0:
214
  if flyovers[-1][0][-1].i < doc[-1].i:
215
+ interstices.append((doc[flyovers[-1][0][-1].i + 1 :], 0))
216
  else:
217
  interstices.append((doc, 0))
218
  flyovers = [f for f in flyovers if len(f[0]) > 0]
219
  return sorted(flyovers + interstices, key=lambda x: x[0][0].i)
220
 
221
+
222
  from fasthtml_hf import setup_hf_backup
223
  from fasthtml.common import *
224
  import re
 
230
  def index():
231
  page = Div(
232
  Form(hx_post=send, hx_target="#output", hx_swap="outerHTML")(
233
+ Div(
234
+ Span(
235
+ Button("Check"),
236
+ A("How this works", href="/about"),
237
+ style="margin-bottom: 1rem; display: flex; gap: 1rem; align-items: center",
238
+ ),
239
+ Textarea(name="text", style="height: calc(100vh - 11rem)"),
240
+ )
241
+ ),
242
+ Div(
243
+ Div(
244
+ Em(
245
+ "Highlighted text segments can be shortened or reordered to improve readability."
246
+ ),
247
+ cls="overflow-auto",
248
+ style="height: 4rem; text-wrap: balance; padding: 0rem 1rem",
249
  ),
250
+ Div(id="output", style="padding: 1rem; padding-bottom: calc(1rem - 5px)"),
251
+ ),
252
+ cls="grid",
253
+ )
254
+ return Titled("Readability feedback", page)
255
+
256
+
257
+ @app.get
258
+ def about():
259
+ content = Div(
260
+ H2("How this works"),
261
+ P(
262
+ "One of the keys to writing clearly is to ",
263
+ Em("keep related words close together"),
264
+ ". Don't, if you want to be understood, insert any long asides! (See what I did there?) This tool helps you visually identify places in your writing where two related words are interrupted by an aside, which you can then either shorten or move to a different position in the sentence.",
265
+ ),
266
+ P(
267
+ "But how do we identify words in a sentence that are related to each other? We can do this using a technique from natural language processing called ",
268
+ Em("dependency parsing"),
269
+ ". For example, we can take a sentence like ",
270
+ Var("The manager approved the proposal although she had doubts"),
271
+ ", and produce a diagram like the following:",
272
+ ),
273
  Div(
274
+ NotStr(
275
+ open("sample_parse.svg", "r").read(),
276
+ ),
277
+ style="margin-top: 1rem; margin-bottom: 1rem; width: 100%; overflow-x: auto",
278
  ),
279
+ P(
280
+ "This tells us, for example, that ",
281
+ Var("manager"),
282
+ " (or ",
283
+ Var("the manager"),
284
+ ") is the subject of ",
285
+ Var("approved"),
286
+ ' (since she is the "main character" of the event of approving); that ',
287
+ Var("proposal"),
288
+ " (or ",
289
+ Var("the proposal"),
290
+ ") is a complement of ",
291
+ Var("approved"),
292
+ " (since you cannot imagine an act of approving without imagining the thing that is being approved—in this case, the proposal); and that ",
293
+ Var("although"),
294
+ " (or ",
295
+ Var("although she had doubts"),
296
+ ") is a modifier of ",
297
+ Var("approved"),
298
+ " (since it gives us the context of the manager's approval). Naturally, subjects and complements are more closely related to the verb than modifiers are, and so we ignore modifiers when identifying related words that should be kept close together. We can see that in this sentence, the subject and the complement are right next to the verb, and so the sentence is easy to read.",
299
+ ),
300
+ P("Now let us see what happens when we reorder the sentence:"),
301
+ Div(
302
+ NotStr(
303
+ open("sample_parse_2.svg", "r").read(),
304
+ ),
305
+ style="margin-top: 1rem; margin-bottom: 1rem; width: 100%; overflow-x: auto",
306
+ ),
307
+ P(
308
+ "Here, we see that the modifier ",
309
+ Var("although she had doubts"),
310
+ " now interrupts the subject relation between ",
311
+ Var("the manager"),
312
+ " and ",
313
+ Var("approved"),
314
+ ". And indeed, you can see that this sentence is harder to read than the first one.",
315
+ ),
316
+ H2("Technical details"),
317
+ P(
318
+ "The inspiration for this tool is the idea of ",
319
+ Em("Dependency Length Minimisation"),
320
+ " (DLM) in psycholinguistics, which posits that human languages tend to minimise the distance between syntactically related words to reduce cognitive load during sentence processing. For more information on DLM, see ",
321
+ A(
322
+ "Futrell et al. (2015)",
323
+ href="https://pmc.ncbi.nlm.nih.gov/articles/PMC4547262/",
324
+ ),
325
+ ". For evidence that dependency length predicts reading times in English, see e.g. ",
326
+ A(
327
+ "Bartek et al. (2011)",
328
+ href="https://pubmed.ncbi.nlm.nih.gov/21707210/",
329
+ ),
330
+ ".",
331
+ ),
332
+ P(
333
+ "I have used the ",
334
+ A("spaCy", href="https://spacy.io/"),
335
+ " library's ",
336
+ Var("en_core_web_sm"),
337
+ " model to perform dependency parsing, adjusting the results to bring them in line with the ",
338
+ A(
339
+ "Surface Syntactic Universal Dependencies (SUD)",
340
+ href="https://surfacesyntacticud.org",
341
+ ),
342
+ " framework, which is more consistent with linguistic theories. For any dependency arc that exhibits the ",
343
+ Var("subj"),
344
+ " (subject) or ",
345
+ Var("comp"),
346
+ " (complement) relation, the words lying between the head and the dependent are highlighted with an opacity proportional to the number of heads (i.e. words with at least one dependent) in that interval. This follows the revised definition of dependency length proposed by ",
347
+ A(
348
+ "Yadav et al. (2022)",
349
+ href="https://direct.mit.edu/opmi/article/doi/10.1162/opmi_a_00060/112598/A-Reappraisal-of-Dependency-Length-Minimization-as",
350
+ ),
351
+ ".",
352
+ ),
353
+ P(
354
+ "The web app itself was built using the ",
355
+ A("FastHTML", href="https://fasthtml.org/"),
356
+ " framework, which I learned about in the ",
357
+ A("Solve It With Code", href="https://solve.it.com/"),
358
+ " course from ",
359
+ A("Answer.AI", href="https://www.answer.ai/"),
360
+ ". The entire development took two days (starting on December 26, 2025), with an extra day for handling various edge cases. This page was added on January 4, 2026.",
361
+ ),
362
+ A("Back to main page", href="/"),
363
+ style="padding-bottom: 1rem; padding-top: 1rem; max-width: 800px; margin: auto",
364
  )
365
+ return Titled("Readability feedback", content)
366
+
367
 
368
  @app.post
369
+ def send(text: str):
370
  paragraphs = re.sub(r"[^\S\r\n]+", " ", text).split("\r\n\r\n")
371
+ docs = [sudify(nlp(para)) for para in paragraphs]
372
  annot_paras = [get_fluff(doc) for doc in docs]
373
+ return Div(
374
+ *[
375
+ P(
376
+ *[
377
+ Span(
378
+ Span(
379
+ a[0],
380
+ style=f"background: light-dark(rgba(237, 201, 241, {a[1]/5}), rgba(182, 69, 205, {a[1]/5}))",
381
+ ),
382
+ Span(" "),
383
+ )
384
+ for a in annot_para
385
+ ],
386
+ style="margin-bottom: 1.5em",
387
+ )
388
+ for annot_para in annot_paras[:-1]
389
+ ],
390
+ P(
391
+ *[
392
+ Span(
393
+ Span(
394
+ a[0],
395
+ style=f"background: light-dark(rgba(237, 201, 241, {a[1]/5}), rgba(182, 69, 205, {a[1]/5}))",
396
+ ),
397
+ Span(" "),
398
+ )
399
+ for a in annot_paras[-1]
400
+ ],
401
+ style="margin-bottom: 0em",
402
+ ),
403
+ id="output",
404
+ cls="overflow-auto",
405
+ style="height: calc(100vh - 11rem); padding: 1rem; padding-bottom: calc(1rem - 5px)",
406
+ )
407
+
408
 
409
  setup_hf_backup(app)
410
  serve()
sample_parse.svg ADDED
sample_parse_2.svg ADDED