{ "STSBenchmark": { "train": { "pearson": [ 0.7593357300138104, 0.0 ], "spearman": [ 0.7363780516874698, 0.0 ], "nsamples": 5749 }, "dev": { "pearson": [ 0.7708717320377951, 1.0423163280003215e-295 ], "spearman": [ 0.7786676025109732, 1.5214906511814883e-305 ], "nsamples": 1500 }, "test": { "pearson": [ 0.7501376173451568, 1.3467040400624944e-249 ], "spearman": [ 0.750824400583584, 2.649603496637417e-250 ], "nsamples": 1379 }, "all": { "pearson": { "all": 0.7604793924665235, "mean": 0.7601150264655875, "wmean": 0.759871173415051 }, "spearman": { "all": 0.7504771603185239, "mean": 0.7552900182606758, "wmean": 0.7460391366854991 } } }, "SICKRelatedness": { "train": { "pearson": [ 0.7662304008155296, 0.0 ], "spearman": [ 0.6902538404584456, 0.0 ], "nsamples": 4500 }, "dev": { "pearson": [ 0.7821571234476052, 2.2004576953729478e-104 ], "spearman": [ 0.7166329672415084, 5.843294318811089e-80 ], "nsamples": 500 }, "test": { "pearson": [ 0.7611310123704713, 0.0 ], "spearman": [ 0.6832295457395683, 0.0 ], "nsamples": 4927 }, "all": { "pearson": { "all": 0.7644308360476054, "mean": 0.7698395122112021, "wmean": 0.7645016483673817 }, "spearman": { "all": 0.6882116860582081, "mean": 0.6967054511465074, "wmean": 0.6880961758378777 } } }, "eval_senteval-stsb_spearman": 0.7786676025109732, "eval_senteval-sickr_spearman": 0.7166329672415084, "eval_senteval-avg_sts": 0.7476502848762407 }