gsaltintas commited on
Commit
3c65d02
·
verified ·
1 Parent(s): 9cb8191

Upload script_1/flexitok--bpe_script_Arab_16000_overlap.json with huggingface_hub

Browse files
script_1/flexitok--bpe_script_Arab_16000_overlap.json CHANGED
@@ -1 +1 @@
1
- {"1": {"ratio_to_total_tokens": 0.8657147914331229, "expected_training_ratio_in_superset": 0.07870134467573844, "num_tokens": 14673}, "2": {"ratio_to_total_tokens": 0.00430703876334887, "expected_training_ratio_in_superset": 0.0007830979569725219, "num_tokens": 73}, "3": {"ratio_to_total_tokens": 0.002419021771195941, "expected_training_ratio_in_superset": 0.0006597332103261657, "num_tokens": 41}, "4": {"ratio_to_total_tokens": 0.0018880169921529294, "expected_training_ratio_in_superset": 0.0006865516335101562, "num_tokens": 32}, "5": {"ratio_to_total_tokens": 0.003540031860286743, "expected_training_ratio_in_superset": 0.0016091053910394285, "num_tokens": 60}, "6": {"ratio_to_total_tokens": 0.004189037701339312, "expected_training_ratio_in_superset": 0.002284929655275988, "num_tokens": 71}, "7": {"ratio_to_total_tokens": 0.005369048321434893, "expected_training_ratio_in_superset": 0.003416667113640386, "num_tokens": 91}, "8": {"ratio_to_total_tokens": 0.005841052569473125, "expected_training_ratio_in_superset": 0.004248038232344091, "num_tokens": 99}, "9": {"ratio_to_total_tokens": 0.005841052569473125, "expected_training_ratio_in_superset": 0.004779043011387102, "num_tokens": 99}, "10": {"ratio_to_total_tokens": 0.006608059472535253, "expected_training_ratio_in_superset": 0.006007326793213866, "num_tokens": 112}, "11": {"ratio_to_total_tokens": 0.09428284854563691, "expected_training_ratio_in_superset": 0.09428284854563691, "num_tokens": 1598}, "total_training_compared_to_full_model": 0.19745868621908505}
 
1
+ {"1": {"ratio_to_total_tokens": 0.8760023584905661, "expected_training_ratio_in_superset": 0.07963657804459692, "num_tokens": 14857}, "2": {"ratio_to_total_tokens": 0.0030070754716981134, "expected_training_ratio_in_superset": 0.0005467409948542025, "num_tokens": 51}, "3": {"ratio_to_total_tokens": 0.0015330188679245284, "expected_training_ratio_in_superset": 0.00041809605488850766, "num_tokens": 26}, "4": {"ratio_to_total_tokens": 0.0018278301886792453, "expected_training_ratio_in_superset": 0.0006646655231560892, "num_tokens": 31}, "5": {"ratio_to_total_tokens": 0.002240566037735849, "expected_training_ratio_in_superset": 0.0010184391080617495, "num_tokens": 38}, "6": {"ratio_to_total_tokens": 0.00294811320754717, "expected_training_ratio_in_superset": 0.0016080617495711834, "num_tokens": 50}, "7": {"ratio_to_total_tokens": 0.0039504716981132075, "expected_training_ratio_in_superset": 0.00251393653516295, "num_tokens": 67}, "8": {"ratio_to_total_tokens": 0.004304245283018868, "expected_training_ratio_in_superset": 0.003130360205831904, "num_tokens": 73}, "9": {"ratio_to_total_tokens": 0.004834905660377358, "expected_training_ratio_in_superset": 0.003955831903945111, "num_tokens": 82}, "10": {"ratio_to_total_tokens": 0.005660377358490566, "expected_training_ratio_in_superset": 0.005145797598627787, "num_tokens": 96}, "11": {"ratio_to_total_tokens": 0.09369103773584905, "expected_training_ratio_in_superset": 0.09369103773584905, "num_tokens": 1589}, "total_training_compared_to_full_model": 0.19232954545454545}