Upload safe/flexitok--bpe_ell_Grek_8000_overlap.json with huggingface_hub
Browse files
safe/flexitok--bpe_ell_Grek_8000_overlap.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"1": {"ratio_to_total_tokens": 0.899125, "expected_training_ratio_in_superset": 0.04281547619047619, "num_tokens": 7193}, "2": {"ratio_to_total_tokens": 0.000375, "expected_training_ratio_in_superset": 3.571428571428571e-05, "num_tokens": 3}, "3": {"ratio_to_total_tokens": 0.00025, "expected_training_ratio_in_superset": 3.571428571428571e-05, "num_tokens": 2}, "4": {"ratio_to_total_tokens": 0.000625, "expected_training_ratio_in_superset": 0.00011904761904761905, "num_tokens": 5}, "5": {"ratio_to_total_tokens": 0.0005, "expected_training_ratio_in_superset": 0.00011904761904761905, "num_tokens": 4}, "6": {"ratio_to_total_tokens": 0.000375, "expected_training_ratio_in_superset": 0.00010714285714285714, "num_tokens": 3}, "7": {"ratio_to_total_tokens": 0.000875, "expected_training_ratio_in_superset": 0.00029166666666666664, "num_tokens": 7}, "8": {"ratio_to_total_tokens": 0.0005, "expected_training_ratio_in_superset": 0.00019047619047619045, "num_tokens": 4}, "9": {"ratio_to_total_tokens": 0.00075, "expected_training_ratio_in_superset": 0.0003214285714285714, "num_tokens": 6}, "10": {"ratio_to_total_tokens": 0.002, "expected_training_ratio_in_superset": 0.0009523809523809524, "num_tokens": 16}, "11": {"ratio_to_total_tokens": 0.001875, "expected_training_ratio_in_superset": 0.0009821428571428572, "num_tokens": 15}, "12": {"ratio_to_total_tokens": 0.002125, "expected_training_ratio_in_superset": 0.0012142857142857142, "num_tokens": 17}, "13": {"ratio_to_total_tokens": 0.002125, "expected_training_ratio_in_superset": 0.0013154761904761905, "num_tokens": 17}, "14": {"ratio_to_total_tokens": 0.003125, "expected_training_ratio_in_superset": 0.002083333333333333, "num_tokens": 25}, "15": {"ratio_to_total_tokens": 0.003625, "expected_training_ratio_in_superset": 0.0025892857142857145, "num_tokens": 29}, "16": {"ratio_to_total_tokens": 0.006625, "expected_training_ratio_in_superset": 0.005047619047619047, "num_tokens": 53}, "17": {"ratio_to_total_tokens": 0.003625, "expected_training_ratio_in_superset": 0.0029345238095238096, "num_tokens": 29}, "18": {"ratio_to_total_tokens": 0.0085, "expected_training_ratio_in_superset": 0.007285714285714286, "num_tokens": 68}, "19": {"ratio_to_total_tokens": 0.006625, "expected_training_ratio_in_superset": 0.005994047619047619, "num_tokens": 53}, "20": {"ratio_to_total_tokens": 0.00575, "expected_training_ratio_in_superset": 0.0054761904761904765, "num_tokens": 46}, "21": {"ratio_to_total_tokens": 0.050625, "expected_training_ratio_in_superset": 0.050625, "num_tokens": 405}, "total_training_compared_to_full_model": 0.13053571428571428}
|