syhrlhyn
/

aibys-tokenizer

Model card Files Files and versions

syhrlhyn committed 4 days ago

Commit

9bd3418

·

verified ·

1 Parent(s): e9a0d1c

Delete tes.py

Files changed (1) hide show

tes.py +0 -46

tes.py DELETED Viewed

@@ -1,46 +0,0 @@
-import sentencepiece as spm
-import os
-def interactive_test(model_path="aibys.model"):
-    if not os.path.exists(model_path):
-        print(f"❌ File model tidak ditemukan di: {model_path}")
-        return
-    # Load model
-    sp = spm.SentencePieceProcessor()
-    sp.load(model_path)
-    print("="*60)
-    print("        🤖 AIBYS TOKENIZER INTERACTIVE TESTER")
-    print("          Type 'exit' atau 'keluar' untuk stop")
-    print("="*60)
-    print(f"Vocab Size: {sp.vocab_size()}")
-    while True:
-        print("\n" + "-"*50)
-        text = input("📝 Masukkan kalimat: ")
-        if text.lower() in ['exit', 'keluar', 'q']:
-            print("👋 Sampai jumpa, Syahril!")
-            break
-        if not text.strip():
-            continue
-        # Proses Tokenisasi
-        tokens = sp.encode_as_pieces(text)
-        ids = sp.encode_as_ids(text)
-        print(f"\n📊 Hasil Analisis:")
-        print(f"   Input      : {text}")
-        print(f"   Tokens     : {tokens}")
-        print(f"   Token IDs  : {ids}")
-        print(f"   Count      : {len(ids)} Token")
-        # Cek Efisiensi (Estimasi: makin sedikit token vs jumlah kata, makin bagus)
-        kata_count = len(text.split())
-        efisiensi = "SANGAT BAGUS" if len(ids) <= kata_count + 2 else "STANDAR"
-        print(f"   Efisiensi  : {efisiensi}")
-if __name__ == "__main__":
-    interactive_test()