hpprc committed on Apr 14

Commit

0d37081

verified ·

1 Parent(s): 7886bde

Upload 17 files

Browse files

Files changed (17) hide show

results-len512/Classification/scores_amazon_counterfactual_classification.json +23 -0
results-len512/Classification/scores_amazon_review_classification.json +23 -0
results-len512/Classification/scores_massive_intent_classification.json +23 -0
results-len512/Classification/scores_massive_scenario_classification.json +23 -0
results-len512/Clustering/scores_livedoor_news.json +36 -0
results-len512/Clustering/scores_mewsc16.json +36 -0
results-len512/PairClassification/scores_paws_x_ja.json +41 -0
results-len512/Reranking/scores_esci.json +31 -0
results-len512/Retrieval/scores_jagovfaqs_22k.json +43 -0
results-len512/Retrieval/scores_jaqket.json +43 -0
results-len512/Retrieval/scores_mrtydi.json +43 -0
results-len512/Retrieval/scores_nlp_journal_abs_intro.json +43 -0
results-len512/Retrieval/scores_nlp_journal_title_abs.json +43 -0
results-len512/Retrieval/scores_nlp_journal_title_intro.json +43 -0
results-len512/STS/scores_jsick.json +31 -0
results-len512/STS/scores_jsts.json +31 -0
results-len512/summary.json +62 -0

results-len512/Classification/scores_amazon_counterfactual_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.8076989283604759,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.9098712446351931,
+                "macro_f1": 0.6259174311926605
+            },
+            "logreg": {
+                "accuracy": 0.9120171673819742,
+                "macro_f1": 0.7401074610623682
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.9346895074946466,
+                "macro_f1": 0.8076989283604759
+            }
+        }
+    }
+}

results-len512/Classification/scores_amazon_review_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.6002930507515865,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.4572,
+                "macro_f1": 0.4502483462385972
+            },
+            "logreg": {
+                "accuracy": 0.6088,
+                "macro_f1": 0.6028591976118355
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.6054,
+                "macro_f1": 0.6002930507515865
+            }
+        }
+    }
+}

results-len512/Classification/scores_massive_intent_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.7927230771632646,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.7712739793408756,
+                "macro_f1": 0.7556875588894797
+            },
+            "logreg": {
+                "accuracy": 0.8327594687653713,
+                "macro_f1": 0.8262484502743833
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.8298587760591796,
+                "macro_f1": 0.7927230771632646
+            }
+        }
+    }
+}

results-len512/Classification/scores_massive_scenario_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.8836398132177599,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.8657156910969012,
+                "macro_f1": 0.859699565451082
+            },
+            "logreg": {
+                "accuracy": 0.882439744220364,
+                "macro_f1": 0.8795176163694028
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.8856758574310692,
+                "macro_f1": 0.8836398132177599
+            }
+        }
+    }
+}

results-len512/Clustering/scores_livedoor_news.json ADDED Viewed

	@@ -0,0 +1,36 @@

+{
+    "metric_name": "v_measure_score",
+    "metric_value": 0.6039269159025831,
+    "details": {
+        "optimal_clustering_model_name": "MiniBatchKMeans",
+        "val_scores": {
+            "MiniBatchKMeans": {
+                "v_measure_score": 0.5960385156082993,
+                "homogeneity_score": 0.5901260734047985,
+                "completeness_score": 0.6020706296953126
+            },
+            "AgglomerativeClustering": {
+                "v_measure_score": 0.583716765442441,
+                "homogeneity_score": 0.5673363073951831,
+                "completeness_score": 0.6010712376730697
+            },
+            "BisectingKMeans": {
+                "v_measure_score": 0.555434369511391,
+                "homogeneity_score": 0.5533062994229689,
+                "completeness_score": 0.557578872332676
+            },
+            "Birch": {
+                "v_measure_score": 0.583716765442441,
+                "homogeneity_score": 0.5673363073951831,
+                "completeness_score": 0.6010712376730697
+            }
+        },
+        "test_scores": {
+            "MiniBatchKMeans": {
+                "v_measure_score": 0.6039269159025831,
+                "homogeneity_score": 0.5959125218894525,
+                "completeness_score": 0.6121598189000157
+            }
+        }
+    }
+}

results-len512/Clustering/scores_mewsc16.json ADDED Viewed

	@@ -0,0 +1,36 @@

+{
+    "metric_name": "v_measure_score",
+    "metric_value": 0.5133038855338062,
+    "details": {
+        "optimal_clustering_model_name": "Birch",
+        "val_scores": {
+            "MiniBatchKMeans": {
+                "v_measure_score": 0.510867661944874,
+                "homogeneity_score": 0.5605115011968407,
+                "completeness_score": 0.469302128698923
+            },
+            "AgglomerativeClustering": {
+                "v_measure_score": 0.5147662040011469,
+                "homogeneity_score": 0.5531310208295678,
+                "completeness_score": 0.48137812268486785
+            },
+            "BisectingKMeans": {
+                "v_measure_score": 0.4918319882518622,
+                "homogeneity_score": 0.5376041031234438,
+                "completeness_score": 0.45324249905198777
+            },
+            "Birch": {
+                "v_measure_score": 0.51740915477174,
+                "homogeneity_score": 0.5588139550196363,
+                "completeness_score": 0.4817167967576891
+            }
+        },
+        "test_scores": {
+            "Birch": {
+                "v_measure_score": 0.5133038855338062,
+                "homogeneity_score": 0.5481383517989595,
+                "completeness_score": 0.4826323579250646
+            }
+        }
+    }
+}

results-len512/PairClassification/scores_paws_x_ja.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+    "metric_name": "binary_f1",
+    "metric_value": 0.6225736879942487,
+    "details": {
+        "optimal_distance_metric": "dot_similarities",
+        "val_scores": {
+            "cosine_distances": {
+                "accuracy": 0.5725,
+                "accuracy_threshold": 0.7325698733329773,
+                "binary_f1": 0.5979670522257273,
+                "binary_f1_threshold": 1.0
+            },
+            "manhatten_distances": {
+                "accuracy": 0.6075,
+                "accuracy_threshold": 91.31901550292969,
+                "binary_f1": 0.6016949152542372,
+                "binary_f1_threshold": 786.4454956054688
+            },
+            "euclidean_distances": {
+                "accuracy": 0.6075,
+                "accuracy_threshold": 5.207228660583496,
+                "binary_f1": 0.6016949152542372,
+                "binary_f1_threshold": 45.460025787353516
+            },
+            "dot_similarities": {
+                "accuracy": 0.5825,
+                "accuracy_threshold": 6222.314453125,
+                "binary_f1": 0.6046176046176047,
+                "binary_f1_threshold": 5251.693359375
+            }
+        },
+        "test_scores": {
+            "dot_similarities": {
+                "accuracy": 0.5705,
+                "accuracy_threshold": 6222.314453125,
+                "binary_f1": 0.6225736879942487,
+                "binary_f1_threshold": 5251.693359375
+            }
+        }
+    }
+}

results-len512/Reranking/scores_esci.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.9334575664125155,
+    "details": {
+        "optimal_distance_metric": "euclidean_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "ndcg@10": 0.9480715786819617,
+                "ndcg@20": 0.9588590589385586,
+                "ndcg@40": 0.9663121013878336
+            },
+            "dot_score": {
+                "ndcg@10": 0.9320754586179866,
+                "ndcg@20": 0.9468361394565974,
+                "ndcg@40": 0.9554828676062351
+            },
+            "euclidean_distance": {
+                "ndcg@10": 0.9482545881429024,
+                "ndcg@20": 0.9589918342682602,
+                "ndcg@40": 0.9664476093776743
+            }
+        },
+        "test_scores": {
+            "euclidean_distance": {
+                "ndcg@10": 0.9334575664125155,
+                "ndcg@20": 0.9499440970639671,
+                "ndcg@40": 0.9591420703620055
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_jagovfaqs_22k.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.7664675957880878,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.6341035390465048,
+                "accuracy@3": 0.8008189529102077,
+                "accuracy@5": 0.8470312957004972,
+                "accuracy@10": 0.8900263234863995,
+                "ndcg@10": 0.7660561172829335,
+                "mrr@10": 0.7258752443163089
+            },
+            "dot_score": {
+                "accuracy@1": 0.3208540508920737,
+                "accuracy@3": 0.5013161743199765,
+                "accuracy@5": 0.5764843521497514,
+                "accuracy@10": 0.6689090377303305,
+                "ndcg@10": 0.4876219735593598,
+                "mrr@10": 0.4305070404880283
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.6314711904065516,
+                "accuracy@3": 0.7987715706346885,
+                "accuracy@5": 0.8455688797894121,
+                "accuracy@10": 0.8873939748464463,
+                "ndcg@10": 0.7635587399092253,
+                "mrr@10": 0.7234064309159369
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.6359649122807017,
+                "accuracy@3": 0.8011695906432749,
+                "accuracy@5": 0.8482456140350877,
+                "accuracy@10": 0.887719298245614,
+                "ndcg@10": 0.7664675957880878,
+                "mrr@10": 0.7270308874036948
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_jaqket.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.7180699960435167,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.5618090452261306,
+                "accuracy@3": 0.7577889447236181,
+                "accuracy@5": 0.7919597989949749,
+                "accuracy@10": 0.8381909547738694,
+                "ndcg@10": 0.7084681554153308,
+                "mrr@10": 0.6660417165191037
+            },
+            "dot_score": {
+                "accuracy@1": 0.43517587939698493,
+                "accuracy@3": 0.6231155778894473,
+                "accuracy@5": 0.6814070351758794,
+                "accuracy@10": 0.7437185929648241,
+                "ndcg@10": 0.5904434310879052,
+                "mrr@10": 0.5413404323203317
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.5487437185929648,
+                "accuracy@3": 0.749748743718593,
+                "accuracy@5": 0.7849246231155779,
+                "accuracy@10": 0.8311557788944723,
+                "ndcg@10": 0.6974016012793113,
+                "mrr@10": 0.6538426258275508
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.567703109327984,
+                "accuracy@3": 0.757271815446339,
+                "accuracy@5": 0.8164493480441324,
+                "accuracy@10": 0.8565697091273822,
+                "ndcg@10": 0.7180699960435167,
+                "mrr@10": 0.6729501998057665
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_mrtydi.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.47178534512951525,
+    "details": {
+        "optimal_distance_metric": "euclidean_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.3900862068965517,
+                "accuracy@3": 0.5711206896551724,
+                "accuracy@5": 0.6325431034482759,
+                "accuracy@10": 0.7036637931034483,
+                "ndcg@10": 0.5437386125657795,
+                "mrr@10": 0.4929734537493152
+            },
+            "dot_score": {
+                "accuracy@1": 0.15301724137931033,
+                "accuracy@3": 0.26185344827586204,
+                "accuracy@5": 0.3103448275862069,
+                "accuracy@10": 0.37823275862068967,
+                "ndcg@10": 0.2583544424007982,
+                "mrr@10": 0.22087181855500812
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.3933189655172414,
+                "accuracy@3": 0.5732758620689655,
+                "accuracy@5": 0.6314655172413793,
+                "accuracy@10": 0.7025862068965517,
+                "ndcg@10": 0.5458202479710179,
+                "mrr@10": 0.4958350437876296
+            }
+        },
+        "test_scores": {
+            "euclidean_distance": {
+                "accuracy@1": 0.33611111111111114,
+                "accuracy@3": 0.5291666666666667,
+                "accuracy@5": 0.6069444444444444,
+                "accuracy@10": 0.6805555555555556,
+                "ndcg@10": 0.47178534512951525,
+                "mrr@10": 0.44654872134038764
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_nlp_journal_abs_intro.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.9611129584687909,
+    "details": {
+        "optimal_distance_metric": "euclidean_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.8852459016393442,
+                "accuracy@3": 0.9508196721311475,
+                "accuracy@5": 0.9836065573770492,
+                "accuracy@10": 0.9918032786885246,
+                "ndcg@10": 0.9416795109749949,
+                "mrr@10": 0.9252146760343483
+            },
+            "dot_score": {
+                "accuracy@1": 0.7704918032786885,
+                "accuracy@3": 0.8688524590163934,
+                "accuracy@5": 0.8852459016393442,
+                "accuracy@10": 0.9344262295081968,
+                "ndcg@10": 0.8509358984819808,
+                "mrr@10": 0.8242909185532137
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.8852459016393442,
+                "accuracy@3": 0.9672131147540983,
+                "accuracy@5": 0.9754098360655737,
+                "accuracy@10": 0.9918032786885246,
+                "ndcg@10": 0.9436379619364552,
+                "mrr@10": 0.9276736924277909
+            }
+        },
+        "test_scores": {
+            "euclidean_distance": {
+                "accuracy@1": 0.9308943089430894,
+                "accuracy@3": 0.9695121951219512,
+                "accuracy@5": 0.9796747967479674,
+                "accuracy@10": 0.9878048780487805,
+                "ndcg@10": 0.9611129584687909,
+                "mrr@10": 0.9523736933797909
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_nlp_journal_title_abs.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.9812952838148481,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.9590163934426229,
+                "accuracy@3": 0.9836065573770492,
+                "accuracy@5": 1.0,
+                "accuracy@10": 1.0,
+                "ndcg@10": 0.9812321198854286,
+                "mrr@10": 0.975
+            },
+            "dot_score": {
+                "accuracy@1": 0.680327868852459,
+                "accuracy@3": 0.8852459016393442,
+                "accuracy@5": 0.9344262295081968,
+                "accuracy@10": 0.9754098360655737,
+                "ndcg@10": 0.8353833079929985,
+                "mrr@10": 0.7894320843091334
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.9590163934426229,
+                "accuracy@3": 0.9836065573770492,
+                "accuracy@5": 1.0,
+                "accuracy@10": 1.0,
+                "ndcg@10": 0.9812321198854286,
+                "mrr@10": 0.975
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.959349593495935,
+                "accuracy@3": 0.9939024390243902,
+                "accuracy@5": 0.9939024390243902,
+                "accuracy@10": 0.9959349593495935,
+                "ndcg@10": 0.9812952838148481,
+                "mrr@10": 0.9762388695315525
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_nlp_journal_title_intro.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.8825842093499676,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.7459016393442623,
+                "accuracy@3": 0.860655737704918,
+                "accuracy@5": 0.9098360655737705,
+                "accuracy@10": 0.9344262295081968,
+                "ndcg@10": 0.84056074193758,
+                "mrr@10": 0.8101775956284151
+            },
+            "dot_score": {
+                "accuracy@1": 0.5819672131147541,
+                "accuracy@3": 0.7704918032786885,
+                "accuracy@5": 0.819672131147541,
+                "accuracy@10": 0.8770491803278688,
+                "ndcg@10": 0.7296021589345921,
+                "mrr@10": 0.6820582877959928
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.7295081967213115,
+                "accuracy@3": 0.8688524590163934,
+                "accuracy@5": 0.9098360655737705,
+                "accuracy@10": 0.9262295081967213,
+                "ndcg@10": 0.832395357779658,
+                "mrr@10": 0.8017304189435336
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.7987804878048781,
+                "accuracy@3": 0.9024390243902439,
+                "accuracy@5": 0.9390243902439024,
+                "accuracy@10": 0.9613821138211383,
+                "ndcg@10": 0.8825842093499676,
+                "mrr@10": 0.8569573493353979
+            }
+        }
+    }
+}

results-len512/STS/scores_jsick.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    "metric_name": "spearman",
+    "metric_value": 0.7464955416231873,
+    "details": {
+        "optimal_similarity_metric": "manhatten_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "pearson": 0.7836218434851538,
+                "spearman": 0.756430688801211
+            },
+            "manhatten_distance": {
+                "pearson": 0.7923932174397492,
+                "spearman": 0.7607985259507607
+            },
+            "euclidean_distance": {
+                "pearson": 0.7923932174397492,
+                "spearman": 0.7607985259507607
+            },
+            "dot_score": {
+                "pearson": 0.5635997924106966,
+                "spearman": 0.5248804985646915
+            }
+        },
+        "test_scores": {
+            "manhatten_distance": {
+                "pearson": 0.7817941273703908,
+                "spearman": 0.7464955416231873
+            }
+        }
+    }
+}

results-len512/STS/scores_jsts.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    "metric_name": "spearman",
+    "metric_value": 0.8385298782229563,
+    "details": {
+        "optimal_similarity_metric": "manhatten_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "pearson": 0.8486043626272783,
+                "spearman": 0.8120034758535889
+            },
+            "manhatten_distance": {
+                "pearson": 0.855291696445933,
+                "spearman": 0.8162534021929027
+            },
+            "euclidean_distance": {
+                "pearson": 0.855291696445933,
+                "spearman": 0.8162534021929027
+            },
+            "dot_score": {
+                "pearson": 0.6439197584013935,
+                "spearman": 0.5839306171056204
+            }
+        },
+        "test_scores": {
+            "manhatten_distance": {
+                "pearson": 0.8750297182135832,
+                "spearman": 0.8385298782229563
+            }
+        }
+    }
+}

results-len512/summary.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "Classification": {
+        "amazon_counterfactual_classification": {
+            "macro_f1": 0.8076989283604759
+        },
+        "amazon_review_classification": {
+            "macro_f1": 0.6002930507515865
+        },
+        "massive_intent_classification": {
+            "macro_f1": 0.7927230771632646
+        },
+        "massive_scenario_classification": {
+            "macro_f1": 0.8836398132177599
+        }
+    },
+    "Reranking": {
+        "esci": {
+            "ndcg@10": 0.9334575664125155
+        }
+    },
+    "Retrieval": {
+        "jagovfaqs_22k": {
+            "ndcg@10": 0.7664675957880878
+        },
+        "jaqket": {
+            "ndcg@10": 0.7180699960435167
+        },
+        "mrtydi": {
+            "ndcg@10": 0.47178534512951525
+        },
+        "nlp_journal_abs_intro": {
+            "ndcg@10": 0.9611129584687909
+        },
+        "nlp_journal_title_abs": {
+            "ndcg@10": 0.9812952838148481
+        },
+        "nlp_journal_title_intro": {
+            "ndcg@10": 0.8825842093499676
+        }
+    },
+    "STS": {
+        "jsick": {
+            "spearman": 0.7464955416231873
+        },
+        "jsts": {
+            "spearman": 0.8385298782229563
+        }
+    },
+    "Clustering": {
+        "livedoor_news": {
+            "v_measure_score": 0.6039269159025831
+        },
+        "mewsc16": {
+            "v_measure_score": 0.5133038855338062
+        }
+    },
+    "PairClassification": {
+        "paws_x_ja": {
+            "binary_f1": 0.6225736879942487
+        }
+    }
+}