| { |
| "STSBenchmark": { |
| "train": { |
| "pearson": [ |
| 0.7868313677903059, |
| 0.0 |
| ], |
| "spearman": [ |
| 0.7533061602723176, |
| 0.0 |
| ], |
| "nsamples": 5749 |
| }, |
| "dev": { |
| "pearson": [ |
| 0.8010234738701788, |
| 0.0 |
| ], |
| "spearman": [ |
| 0.8010173901569266, |
| 0.0 |
| ], |
| "nsamples": 1500 |
| }, |
| "test": { |
| "pearson": [ |
| 0.7766524771374954, |
| 1.1662374252806932e-278 |
| ], |
| "spearman": [ |
| 0.7638460069862814, |
| 3.8220116833205965e-264 |
| ], |
| "nsamples": 1379 |
| }, |
| "all": { |
| "pearson": { |
| "all": 0.7882517084559206, |
| "mean": 0.7881691062659933, |
| "wmean": 0.7876718254757005 |
| }, |
| "spearman": { |
| "all": 0.7668425138024548, |
| "mean": 0.7727231858051752, |
| "wmean": 0.7632854478761041 |
| } |
| } |
| }, |
| "SICKRelatedness": { |
| "train": { |
| "pearson": [ |
| 0.7853064744370001, |
| 0.0 |
| ], |
| "spearman": [ |
| 0.7045889188784015, |
| 0.0 |
| ], |
| "nsamples": 4500 |
| }, |
| "dev": { |
| "pearson": [ |
| 0.7952406911697713, |
| 2.6811654216760936e-110 |
| ], |
| "spearman": [ |
| 0.7309801454276812, |
| 1.0951577254305346e-84 |
| ], |
| "nsamples": 500 |
| }, |
| "test": { |
| "pearson": [ |
| 0.7794843403240526, |
| 0.0 |
| ], |
| "spearman": [ |
| 0.6977349592492605, |
| 0.0 |
| ], |
| "nsamples": 4927 |
| }, |
| "all": { |
| "pearson": { |
| "all": 0.7828650051750712, |
| "mean": 0.7866771686436079, |
| "wmean": 0.7829171779317007 |
| }, |
| "spearman": { |
| "all": 0.7025121676824595, |
| "mean": 0.7111013411851145, |
| "wmean": 0.702516404944873 |
| } |
| } |
| }, |
| "MR": { |
| "devacc": 81.09, |
| "acc": 80.59, |
| "ndev": 10662, |
| "ntest": 10662 |
| }, |
| "CR": { |
| "devacc": 87.01, |
| "acc": 86.6, |
| "ndev": 3775, |
| "ntest": 3775 |
| }, |
| "SUBJ": { |
| "devacc": 95.34, |
| "acc": 95.02, |
| "ndev": 10000, |
| "ntest": 10000 |
| }, |
| "MPQA": { |
| "devacc": 88.89, |
| "acc": 88.99, |
| "ndev": 10606, |
| "ntest": 10606 |
| }, |
| "SST2": { |
| "devacc": 84.06, |
| "acc": 84.95, |
| "ndev": 872, |
| "ntest": 1821 |
| }, |
| "TREC": { |
| "devacc": 82.7, |
| "acc": 87.2, |
| "ndev": 5452, |
| "ntest": 500 |
| }, |
| "MRPC": { |
| "devacc": 70.8, |
| "acc": 68.81, |
| "f1": 76.97, |
| "ndev": 4076, |
| "ntest": 1725 |
| }, |
| "STS12": { |
| "MSRpar": { |
| "pearson": [ |
| 0.4506656429961876, |
| 8.587667122234213e-39 |
| ], |
| "spearman": [ |
| 0.4537783738578545, |
| 2.270328303306969e-39 |
| ], |
| "nsamples": 750 |
| }, |
| "MSRvid": { |
| "pearson": [ |
| 0.8735316429807825, |
| 4.363488536726283e-236 |
| ], |
| "spearman": [ |
| 0.8745116790315722, |
| 2.8887254873277706e-237 |
| ], |
| "nsamples": 750 |
| }, |
| "SMTeuroparl": { |
| "pearson": [ |
| 0.5276646768590786, |
| 2.9080130640693665e-34 |
| ], |
| "spearman": [ |
| 0.6225349369600102, |
| 1.3236704498055218e-50 |
| ], |
| "nsamples": 459 |
| }, |
| "surprise.OnWN": { |
| "pearson": [ |
| 0.7340552729415586, |
| 7.588168789192366e-128 |
| ], |
| "spearman": [ |
| 0.6862387036955726, |
| 1.6734444180335097e-105 |
| ], |
| "nsamples": 750 |
| }, |
| "surprise.SMTnews": { |
| "pearson": [ |
| 0.6554833920285361, |
| 2.382715639542081e-50 |
| ], |
| "spearman": [ |
| 0.6338572026855626, |
| 3.2084519789805647e-46 |
| ], |
| "nsamples": 399 |
| }, |
| "all": { |
| "pearson": { |
| "all": 0.667994262204242, |
| "mean": 0.6482801255612287, |
| "wmean": 0.6587597745452379 |
| }, |
| "spearman": { |
| "all": 0.6198695741812278, |
| "mean": 0.6541841792461144, |
| "wmean": 0.659443091175976 |
| } |
| } |
| }, |
| "STS13": { |
| "FNWN": { |
| "pearson": [ |
| 0.570828218970704, |
| 9.847987645161228e-18 |
| ], |
| "spearman": [ |
| 0.6046232001507675, |
| 3.1840503190651897e-20 |
| ], |
| "nsamples": 189 |
| }, |
| "headlines": { |
| "pearson": [ |
| 0.7995020825200164, |
| 9.500980524179015e-168 |
| ], |
| "spearman": [ |
| 0.8125460785135767, |
| 1.649528631120915e-177 |
| ], |
| "nsamples": 750 |
| }, |
| "OnWN": { |
| "pearson": [ |
| 0.7844322816916485, |
| 4.612357080156043e-118 |
| ], |
| "spearman": [ |
| 0.7801367000550998, |
| 5.871872377147612e-116 |
| ], |
| "nsamples": 561 |
| }, |
| "all": { |
| "pearson": { |
| "all": 0.7407620228952401, |
| "mean": 0.718254194394123, |
| "wmean": 0.7650530702029934 |
| }, |
| "spearman": { |
| "all": 0.7458274512781141, |
| "mean": 0.7324353262398148, |
| "wmean": 0.7742266882963925 |
| } |
| } |
| }, |
| "STS14": { |
| "deft-forum": { |
| "pearson": [ |
| 0.5631321216962222, |
| 5.210192672663357e-39 |
| ], |
| "spearman": [ |
| 0.5511772152789268, |
| 4.031968923211026e-37 |
| ], |
| "nsamples": 450 |
| }, |
| "deft-news": { |
| "pearson": [ |
| 0.7692532638001923, |
| 6.387272025432673e-60 |
| ], |
| "spearman": [ |
| 0.7225821241233733, |
| 1.0522226454927607e-49 |
| ], |
| "nsamples": 300 |
| }, |
| "headlines": { |
| "pearson": [ |
| 0.7685532605008147, |
| 3.1092413652073723e-147 |
| ], |
| "spearman": [ |
| 0.72597520728351, |
| 9.721513948491652e-124 |
| ], |
| "nsamples": 750 |
| }, |
| "images": { |
| "pearson": [ |
| 0.8353848860067018, |
| 1.3687751285353585e-196 |
| ], |
| "spearman": [ |
| 0.8008852796417836, |
| 9.492757773828998e-169 |
| ], |
| "nsamples": 750 |
| }, |
| "OnWN": { |
| "pearson": [ |
| 0.8314850837955547, |
| 3.9440310563877586e-193 |
| ], |
| "spearman": [ |
| 0.8316458764161619, |
| 2.851406716141642e-193 |
| ], |
| "nsamples": 750 |
| }, |
| "tweet-news": { |
| "pearson": [ |
| 0.7778758524787571, |
| 4.607989885863323e-153 |
| ], |
| "spearman": [ |
| 0.6958906739489547, |
| 1.1738361486418922e-109 |
| ], |
| "nsamples": 750 |
| }, |
| "all": { |
| "pearson": { |
| "all": 0.73992310716163, |
| "mean": 0.7576140780463737, |
| "wmean": 0.7717759322639277 |
| }, |
| "spearman": { |
| "all": 0.6864467990669687, |
| "mean": 0.7213593961154516, |
| "wmean": 0.734827243221423 |
| } |
| } |
| }, |
| "STS15": { |
| "answers-forums": { |
| "pearson": [ |
| 0.7391296029963142, |
| 5.385805927099778e-66 |
| ], |
| "spearman": [ |
| 0.7409312029744309, |
| 1.789609179402688e-66 |
| ], |
| "nsamples": 375 |
| }, |
| "answers-students": { |
| "pearson": [ |
| 0.7026326622651042, |
| 1.1706959560110963e-112 |
| ], |
| "spearman": [ |
| 0.7107886172788801, |
| 2.1014876744572312e-116 |
| ], |
| "nsamples": 750 |
| }, |
| "belief": { |
| "pearson": [ |
| 0.8006281964159404, |
| 5.439878843301103e-85 |
| ], |
| "spearman": [ |
| 0.8172868949869829, |
| 2.543177483321865e-91 |
| ], |
| "nsamples": 375 |
| }, |
| "headlines": { |
| "pearson": [ |
| 0.8172091326355518, |
| 3.472486751097505e-181 |
| ], |
| "spearman": [ |
| 0.8158723780481846, |
| 4.030205865269612e-180 |
| ], |
| "nsamples": 750 |
| }, |
| "images": { |
| "pearson": [ |
| 0.8784869743544939, |
| 3.750940760878824e-242 |
| ], |
| "spearman": [ |
| 0.8806887757856461, |
| 6.211464354884257e-245 |
| ], |
| "nsamples": 750 |
| }, |
| "all": { |
| "pearson": { |
| "all": 0.7913051772787048, |
| "mean": 0.787617313733481, |
| "wmean": 0.7920519172403193 |
| }, |
| "spearman": { |
| "all": 0.7986117512115241, |
| "mean": 0.7931135738148248, |
| "wmean": 0.7966147050233544 |
| } |
| } |
| }, |
| "STS16": { |
| "answer-answer": { |
| "pearson": [ |
| 0.7177168935513755, |
| 1.7118144003107402e-41 |
| ], |
| "spearman": [ |
| 0.7132893030185777, |
| 8.841119832138394e-41 |
| ], |
| "nsamples": 254 |
| }, |
| "headlines": { |
| "pearson": [ |
| 0.7910112149047425, |
| 1.2553390356155912e-54 |
| ], |
| "spearman": [ |
| 0.8059772680734066, |
| 3.561704789876049e-58 |
| ], |
| "nsamples": 249 |
| }, |
| "plagiarism": { |
| "pearson": [ |
| 0.8146246368802861, |
| 7.416724178775043e-56 |
| ], |
| "spearman": [ |
| 0.8287733749128491, |
| 2.0728091350119785e-59 |
| ], |
| "nsamples": 230 |
| }, |
| "postediting": { |
| "pearson": [ |
| 0.8358664674126319, |
| 5.627683437146896e-65 |
| ], |
| "spearman": [ |
| 0.8514410852739017, |
| 8.855209165489321e-70 |
| ], |
| "nsamples": 244 |
| }, |
| "question-question": { |
| "pearson": [ |
| 0.7757563825820808, |
| 2.9043591729136265e-43 |
| ], |
| "spearman": [ |
| 0.7882765418102572, |
| 1.5472955880308416e-45 |
| ], |
| "nsamples": 209 |
| }, |
| "all": { |
| "pearson": { |
| "all": 0.7727412422624585, |
| "mean": 0.7869951190662233, |
| "wmean": 0.7864334333593027 |
| }, |
| "spearman": { |
| "all": 0.7823935956761426, |
| "mean": 0.7975515146177985, |
| "wmean": 0.7967817209039866 |
| } |
| } |
| }, |
| "eval_senteval-STS12": 0.6198695741812278, |
| "eval_senteval-STS13": 0.7458274512781141, |
| "eval_senteval-STS14": 0.6864467990669687, |
| "eval_senteval-STS15": 0.7986117512115241, |
| "eval_senteval-STS16": 0.7823935956761426, |
| "eval_senteval-STSBenchmark": 0.7668425138024548, |
| "eval_senteval-SICKRelatedness": 0.7025121676824595, |
| "eval_senteval-avg_sts_7": 0.7289291218426988, |
| "eval_senteval-MR": 81.09, |
| "eval_senteval-CR": 87.01, |
| "eval_senteval-SUBJ": 95.34, |
| "eval_senteval-MPQA": 88.89, |
| "eval_senteval-SST2": 84.06, |
| "eval_senteval-TREC": 82.7, |
| "eval_senteval-MRPC": 70.8, |
| "eval_senteval-avg_transfer": 84.27 |
| } |
|
|