gsaltintas commited on
Commit
519ebe1
·
verified ·
1 Parent(s): dde88d0

Upload script_1/flexitok--bpe_script_Germ_32000_overlap.json with huggingface_hub

Browse files
script_1/flexitok--bpe_script_Germ_32000_overlap.json CHANGED
@@ -1 +1 @@
1
- {"1": {"ratio_to_total_tokens": 0.6438764643237487, "expected_training_ratio_in_superset": 0.058534224029431696, "num_tokens": 21161}, "2": {"ratio_to_total_tokens": 0.09773315076829454, "expected_training_ratio_in_superset": 0.017769663776053553, "num_tokens": 3212}, "3": {"ratio_to_total_tokens": 0.08516659059790051, "expected_training_ratio_in_superset": 0.02322725198124559, "num_tokens": 2799}, "4": {"ratio_to_total_tokens": 0.05020538566864446, "expected_training_ratio_in_superset": 0.018256503879507075, "num_tokens": 1650}, "5": {"ratio_to_total_tokens": 0.02951468127186977, "expected_training_ratio_in_superset": 0.013415764214486259, "num_tokens": 970}, "6": {"ratio_to_total_tokens": 0.017404533698463412, "expected_training_ratio_in_superset": 0.009493382017343678, "num_tokens": 572}, "7": {"ratio_to_total_tokens": 0.01323596531264263, "expected_training_ratio_in_superset": 0.008422887017136218, "num_tokens": 435}, "8": {"ratio_to_total_tokens": 0.007454739084132056, "expected_training_ratio_in_superset": 0.005421628424823313, "num_tokens": 245}, "9": {"ratio_to_total_tokens": 0.0033165982047771185, "expected_training_ratio_in_superset": 0.002713580349363097, "num_tokens": 109}, "10": {"ratio_to_total_tokens": 0.003468735737106344, "expected_training_ratio_in_superset": 0.0031533961246421305, "num_tokens": 114}, "11": {"ratio_to_total_tokens": 0.04862315533242051, "expected_training_ratio_in_superset": 0.04862315533242051, "num_tokens": 1598}, "total_training_compared_to_full_model": 0.20903143714645311}
 
1
+ {"1": {"ratio_to_total_tokens": 0.665023581317511, "expected_training_ratio_in_superset": 0.060456689210682826, "num_tokens": 21856}, "2": {"ratio_to_total_tokens": 0.1039099345808611, "expected_training_ratio_in_superset": 0.01889271537833838, "num_tokens": 3415}, "3": {"ratio_to_total_tokens": 0.06922257720979766, "expected_training_ratio_in_superset": 0.018878884693581177, "num_tokens": 2275}, "4": {"ratio_to_total_tokens": 0.044089456869009586, "expected_training_ratio_in_superset": 0.016032529770548937, "num_tokens": 1449}, "5": {"ratio_to_total_tokens": 0.02647193062528526, "expected_training_ratio_in_superset": 0.012032695738766025, "num_tokens": 870}, "6": {"ratio_to_total_tokens": 0.016948121101475734, "expected_training_ratio_in_superset": 0.009244429691714037, "num_tokens": 557}, "7": {"ratio_to_total_tokens": 0.012657842689791572, "expected_training_ratio_in_superset": 0.008054990802594636, "num_tokens": 416}, "8": {"ratio_to_total_tokens": 0.00724174653887114, "expected_training_ratio_in_superset": 0.005266724755542647, "num_tokens": 238}, "9": {"ratio_to_total_tokens": 0.0030427506465845124, "expected_training_ratio_in_superset": 0.0024895232562964194, "num_tokens": 100}, "10": {"ratio_to_total_tokens": 0.0030427506465845124, "expected_training_ratio_in_superset": 0.0027661369514404657, "num_tokens": 100}, "11": {"ratio_to_total_tokens": 0.048349307774227905, "expected_training_ratio_in_superset": 0.048349307774227905, "num_tokens": 1589}, "total_training_compared_to_full_model": 0.20246462802373347}