Total characters in text: """ outputString = outputString + str(txtLen) + """

Token count: """ outputString = outputString + str(numTokens) + """

""" for strToken in strTokens: colorNum = i % len(color_list) chosencolor = color_list[colorNum] outputString = outputString + " " + strToken + "" i = i + 1 outputString = outputString + """

""" return outputString def tokenizeText(inputText): tokens, strTokens = getTokens(inputText) return(getColoredText(inputText, tokens, strTokens)) title = "Tokenizer for Hindi language from Scratch" description = "Created Hindi Tokenizer from Scratch" examples = [ "चिन्नयरसाल में भारत के आन्ध्रप्रदेश राज्य के अन्तर्गत के कडप जिले का एक गाँव है।", "करासीबूंगा, काफलीगैर तहसील में भारत के उत्तराखण्ड राज्य के अन्तर्गत कुमाऊँ मण्डल के बागेश्वर जिले का एक गाँव है।", "इस वाक्य का अनुवाद गूगल100 ट्रांसलेट द्वारा किया जा रहा है।😅", "कैफ़ भोपाली ने कई हिंदी फिल्मों में गीत लिखे, किन्तु 1972 में बनी पाक़ीज़ा उनकी यादगार फिल्म रही।", "छाया गठबंधन की हार के बाद विशेष Yamato बी दा बॉल्स की तलाश में है स्ट्राइक मदपान, जो सितारों शूटिंग से उत्पन्न कहा जाता है। रहस्यमय Haja के साथ एक लड़ाई के बाद और उसके स्ट्राइक फटका, ड्राइव शूटिंग प्राप्त करने, Yamato तो Gunnos, एक रंगरूट बी DaPlayer से मुलाकात की। वह अपने ही हड़ताल को Yamato पुराने मित्रों और प्रतिद्वंद्वियों के साथ विजेता प्रतियोगिता में भाग लेने शॉट मिल गया। लेकिन कुछ नहीं किया वे पता है।.. .. एक भयानक बुराई करने के लिए जोखिम में एक बार फिर बी दा विश्व डाल बारे में है।", "In 2019 google introduced BERT- Bidirectional Encoder Representations from Transformers (paper), which is designed to pre-train a language model from a vast corpus of rew text. What distinguishes it from existing word-embedding models like Word2vec, ELMo etc. is that it is a truly bidirectional model, meaning it is trained on unlabeled text by jointly conditioning both left and right context simultaneously." ] demo = gr.Interface( tokenizeText, inputs = [ gr.Textbox(), ], outputs = [ gr.HTML(), ], title = title, description = description, examples = examples, cache_examples=False ) demo.launch()