hpprc commited on Apr 14

Commit

b58f3a1

verified ·

1 Parent(s): 109a5cf

Upload 17 files

Browse files

Files changed (17) hide show

results-len512/Classification/scores_amazon_counterfactual_classification.json +23 -0
results-len512/Classification/scores_amazon_review_classification.json +23 -0
results-len512/Classification/scores_massive_intent_classification.json +23 -0
results-len512/Classification/scores_massive_scenario_classification.json +23 -0
results-len512/Clustering/scores_livedoor_news.json +36 -0
results-len512/Clustering/scores_mewsc16.json +36 -0
results-len512/PairClassification/scores_paws_x_ja.json +41 -0
results-len512/Reranking/scores_esci.json +31 -0
results-len512/Retrieval/scores_jagovfaqs_22k.json +43 -0
results-len512/Retrieval/scores_jaqket.json +43 -0
results-len512/Retrieval/scores_mrtydi.json +43 -0
results-len512/Retrieval/scores_nlp_journal_abs_intro.json +43 -0
results-len512/Retrieval/scores_nlp_journal_title_abs.json +43 -0
results-len512/Retrieval/scores_nlp_journal_title_intro.json +43 -0
results-len512/STS/scores_jsick.json +31 -0
results-len512/STS/scores_jsts.json +31 -0
results-len512/summary.json +62 -0

results-len512/Classification/scores_amazon_counterfactual_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.8283702018329007,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.9184549356223176,
+                "macro_f1": 0.681235599078341
+            },
+            "logreg": {
+                "accuracy": 0.927038626609442,
+                "macro_f1": 0.7726829268292683
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.9411134903640257,
+                "macro_f1": 0.8283702018329007
+            }
+        }
+    }
+}

results-len512/Classification/scores_amazon_review_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.5918838130358689,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.4536,
+                "macro_f1": 0.4460589777163412
+            },
+            "logreg": {
+                "accuracy": 0.5986,
+                "macro_f1": 0.5938685525496514
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.5964,
+                "macro_f1": 0.5918838130358689
+            }
+        }
+    }
+}

results-len512/Classification/scores_massive_intent_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.7849950487595191,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.7624200688637481,
+                "macro_f1": 0.7429537614615437
+            },
+            "logreg": {
+                "accuracy": 0.8288243974422036,
+                "macro_f1": 0.8195455157035694
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.831876260928043,
+                "macro_f1": 0.7849950487595191
+            }
+        }
+    }
+}

results-len512/Classification/scores_massive_scenario_classification.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+    "metric_name": "macro_f1",
+    "metric_value": 0.87335723142719,
+    "details": {
+        "optimal_classifier_name": "logreg",
+        "val_scores": {
+            "knn_cosine_k_2": {
+                "accuracy": 0.8558780127889818,
+                "macro_f1": 0.8485633592400048
+            },
+            "logreg": {
+                "accuracy": 0.8691588785046729,
+                "macro_f1": 0.8625860435889454
+            }
+        },
+        "test_scores": {
+            "logreg": {
+                "accuracy": 0.8765971755211835,
+                "macro_f1": 0.87335723142719
+            }
+        }
+    }
+}

results-len512/Clustering/scores_livedoor_news.json ADDED Viewed

	@@ -0,0 +1,36 @@

+{
+    "metric_name": "v_measure_score",
+    "metric_value": 0.5408913333324076,
+    "details": {
+        "optimal_clustering_model_name": "AgglomerativeClustering",
+        "val_scores": {
+            "MiniBatchKMeans": {
+                "v_measure_score": 0.5182294367942578,
+                "homogeneity_score": 0.5083929516751572,
+                "completeness_score": 0.5284540682758625
+            },
+            "AgglomerativeClustering": {
+                "v_measure_score": 0.5895844570616736,
+                "homogeneity_score": 0.5798748360491485,
+                "completeness_score": 0.5996247778002453
+            },
+            "BisectingKMeans": {
+                "v_measure_score": 0.547905255250393,
+                "homogeneity_score": 0.544426621916416,
+                "completeness_score": 0.5514286281531552
+            },
+            "Birch": {
+                "v_measure_score": 0.5810872157931731,
+                "homogeneity_score": 0.564042246417553,
+                "completeness_score": 0.5991944609541024
+            }
+        },
+        "test_scores": {
+            "AgglomerativeClustering": {
+                "v_measure_score": 0.5408913333324076,
+                "homogeneity_score": 0.5377939657352733,
+                "completeness_score": 0.5440245855267704
+            }
+        }
+    }
+}

results-len512/Clustering/scores_mewsc16.json ADDED Viewed

	@@ -0,0 +1,36 @@

+{
+    "metric_name": "v_measure_score",
+    "metric_value": 0.5028507755536713,
+    "details": {
+        "optimal_clustering_model_name": "AgglomerativeClustering",
+        "val_scores": {
+            "MiniBatchKMeans": {
+                "v_measure_score": 0.4458851291915875,
+                "homogeneity_score": 0.48533124402844363,
+                "completeness_score": 0.4123691329066709
+            },
+            "AgglomerativeClustering": {
+                "v_measure_score": 0.49536644061268514,
+                "homogeneity_score": 0.5301463317764765,
+                "completeness_score": 0.46486902308967953
+            },
+            "BisectingKMeans": {
+                "v_measure_score": 0.43838510788950696,
+                "homogeneity_score": 0.4772898709546572,
+                "completeness_score": 0.40534472422469503
+            },
+            "Birch": {
+                "v_measure_score": 0.49419823370381905,
+                "homogeneity_score": 0.5264827004846486,
+                "completeness_score": 0.4656444327759002
+            }
+        },
+        "test_scores": {
+            "AgglomerativeClustering": {
+                "v_measure_score": 0.5028507755536713,
+                "homogeneity_score": 0.5309796320912937,
+                "completeness_score": 0.4775522554756309
+            }
+        }
+    }
+}

results-len512/PairClassification/scores_paws_x_ja.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+    "metric_name": "binary_f1",
+    "metric_value": 0.6175182481751825,
+    "details": {
+        "optimal_distance_metric": "dot_similarities",
+        "val_scores": {
+            "cosine_distances": {
+                "accuracy": 0.5725,
+                "accuracy_threshold": 0.7122286558151245,
+                "binary_f1": 0.5979670522257273,
+                "binary_f1_threshold": 1.0
+            },
+            "manhatten_distances": {
+                "accuracy": 0.6045,
+                "accuracy_threshold": 62.02785873413086,
+                "binary_f1": 0.6016949152542372,
+                "binary_f1_threshold": 606.8050537109375
+            },
+            "euclidean_distances": {
+                "accuracy": 0.605,
+                "accuracy_threshold": 5.562343120574951,
+                "binary_f1": 0.6016949152542372,
+                "binary_f1_threshold": 40.35772705078125
+            },
+            "dot_similarities": {
+                "accuracy": 0.581,
+                "accuracy_threshold": 5684.939453125,
+                "binary_f1": 0.6050236621769203,
+                "binary_f1_threshold": 4571.8681640625
+            }
+        },
+        "test_scores": {
+            "dot_similarities": {
+                "accuracy": 0.5655,
+                "accuracy_threshold": 5684.939453125,
+                "binary_f1": 0.6175182481751825,
+                "binary_f1_threshold": 4571.8681640625
+            }
+        }
+    }
+}

results-len512/Reranking/scores_esci.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.9327252616959848,
+    "details": {
+        "optimal_distance_metric": "euclidean_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "ndcg@10": 0.9455943545908806,
+                "ndcg@20": 0.9576462577863859,
+                "ndcg@40": 0.9654667184941765
+            },
+            "dot_score": {
+                "ndcg@10": 0.9316403013236408,
+                "ndcg@20": 0.9466113531644135,
+                "ndcg@40": 0.9552590001860088
+            },
+            "euclidean_distance": {
+                "ndcg@10": 0.9461990989028242,
+                "ndcg@20": 0.9580170663788997,
+                "ndcg@40": 0.9657975841385325
+            }
+        },
+        "test_scores": {
+            "euclidean_distance": {
+                "ndcg@10": 0.9327252616959848,
+                "ndcg@20": 0.949185331338756,
+                "ndcg@40": 0.9585114997970098
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_jagovfaqs_22k.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.7448082812189565,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.6121673003802282,
+                "accuracy@3": 0.7724480842351564,
+                "accuracy@5": 0.8245100906697865,
+                "accuracy@10": 0.8724773325533782,
+                "ndcg@10": 0.7448388962984194,
+                "mrr@10": 0.703620988221749
+            },
+            "dot_score": {
+                "accuracy@1": 0.19801111436092425,
+                "accuracy@3": 0.31354197133664813,
+                "accuracy@5": 0.3606317636735888,
+                "accuracy@10": 0.4305352442234571,
+                "ndcg@10": 0.3070567565407926,
+                "mrr@10": 0.2684574297692174
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.6107048844691431,
+                "accuracy@3": 0.7744954665106757,
+                "accuracy@5": 0.8195378765720971,
+                "accuracy@10": 0.871014916642293,
+                "ndcg@10": 0.7429448986423296,
+                "mrr@10": 0.7017048751839619
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.612280701754386,
+                "accuracy@3": 0.776608187134503,
+                "accuracy@5": 0.8242690058479533,
+                "accuracy@10": 0.873391812865497,
+                "ndcg@10": 0.7448082812189565,
+                "mrr@10": 0.7033651257774068
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_jaqket.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.6885528708504698,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.5246231155778894,
+                "accuracy@3": 0.7195979899497488,
+                "accuracy@5": 0.771859296482412,
+                "accuracy@10": 0.8160804020100503,
+                "ndcg@10": 0.6772692193835311,
+                "mrr@10": 0.6321009810959564
+            },
+            "dot_score": {
+                "accuracy@1": 0.26532663316582916,
+                "accuracy@3": 0.46130653266331656,
+                "accuracy@5": 0.5326633165829145,
+                "accuracy@10": 0.6100502512562814,
+                "ndcg@10": 0.4344150347008597,
+                "mrr@10": 0.3784880752971205
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.5175879396984925,
+                "accuracy@3": 0.7195979899497488,
+                "accuracy@5": 0.7628140703517587,
+                "accuracy@10": 0.8110552763819096,
+                "ndcg@10": 0.671449580225242,
+                "mrr@10": 0.6259735183855789
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.5235707121364093,
+                "accuracy@3": 0.7291875626880642,
+                "accuracy@5": 0.7903711133400201,
+                "accuracy@10": 0.8425275827482447,
+                "ndcg@10": 0.6885528708504698,
+                "mrr@10": 0.6385633089745427
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_mrtydi.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.4493143159382214,
+    "details": {
+        "optimal_distance_metric": "euclidean_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.3459051724137931,
+                "accuracy@3": 0.5247844827586207,
+                "accuracy@5": 0.5980603448275862,
+                "accuracy@10": 0.6896551724137931,
+                "ndcg@10": 0.510986461758995,
+                "mrr@10": 0.4545835899014776
+            },
+            "dot_score": {
+                "accuracy@1": 0.059267241379310345,
+                "accuracy@3": 0.09482758620689655,
+                "accuracy@5": 0.12284482758620689,
+                "accuracy@10": 0.16918103448275862,
+                "ndcg@10": 0.10687041620498051,
+                "mrr@10": 0.08792761357416536
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.3545258620689655,
+                "accuracy@3": 0.53125,
+                "accuracy@5": 0.6088362068965517,
+                "accuracy@10": 0.6950431034482759,
+                "ndcg@10": 0.5184937025559256,
+                "mrr@10": 0.4626274288451007
+            }
+        },
+        "test_scores": {
+            "euclidean_distance": {
+                "accuracy@1": 0.3125,
+                "accuracy@3": 0.5055555555555555,
+                "accuracy@5": 0.5875,
+                "accuracy@10": 0.6583333333333333,
+                "ndcg@10": 0.4493143159382214,
+                "mrr@10": 0.4254756393298057
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_nlp_journal_abs_intro.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.9424351024345127,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.8688524590163934,
+                "accuracy@3": 0.9508196721311475,
+                "accuracy@5": 0.9836065573770492,
+                "accuracy@10": 0.9918032786885246,
+                "ndcg@10": 0.9346504139810682,
+                "mrr@10": 0.9158014571948999
+            },
+            "dot_score": {
+                "accuracy@1": 0.5573770491803278,
+                "accuracy@3": 0.7540983606557377,
+                "accuracy@5": 0.8442622950819673,
+                "accuracy@10": 0.8934426229508197,
+                "ndcg@10": 0.732018537857895,
+                "mrr@10": 0.6797456414259695
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.860655737704918,
+                "accuracy@3": 0.9426229508196722,
+                "accuracy@5": 0.9754098360655737,
+                "accuracy@10": 0.9918032786885246,
+                "ndcg@10": 0.9290878579481767,
+                "mrr@10": 0.9086846213895394
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.8922764227642277,
+                "accuracy@3": 0.9634146341463414,
+                "accuracy@5": 0.9735772357723578,
+                "accuracy@10": 0.983739837398374,
+                "ndcg@10": 0.9424351024345127,
+                "mrr@10": 0.9287488708220415
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_nlp_journal_title_abs.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.9717579001048733,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.9590163934426229,
+                "accuracy@3": 0.9754098360655737,
+                "accuracy@5": 0.9918032786885246,
+                "accuracy@10": 0.9918032786885246,
+                "ndcg@10": 0.9749873698268802,
+                "mrr@10": 0.969535519125683
+            },
+            "dot_score": {
+                "accuracy@1": 0.6147540983606558,
+                "accuracy@3": 0.8360655737704918,
+                "accuracy@5": 0.9262295081967213,
+                "accuracy@10": 0.9426229508196722,
+                "ndcg@10": 0.7917119670702584,
+                "mrr@10": 0.741471506635441
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.9426229508196722,
+                "accuracy@3": 0.9672131147540983,
+                "accuracy@5": 0.9918032786885246,
+                "accuracy@10": 0.9918032786885246,
+                "ndcg@10": 0.967654829355435,
+                "mrr@10": 0.9596994535519126
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.943089430894309,
+                "accuracy@3": 0.9857723577235772,
+                "accuracy@5": 0.9857723577235772,
+                "accuracy@10": 0.9939024390243902,
+                "ndcg@10": 0.9717579001048733,
+                "mrr@10": 0.9643341076267905
+            }
+        }
+    }
+}

results-len512/Retrieval/scores_nlp_journal_title_intro.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+    "metric_name": "ndcg@10",
+    "metric_value": 0.8658442146344819,
+    "details": {
+        "optimal_distance_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.8032786885245902,
+                "accuracy@3": 0.8770491803278688,
+                "accuracy@5": 0.9098360655737705,
+                "accuracy@10": 0.9590163934426229,
+                "ndcg@10": 0.8757852803420108,
+                "mrr@10": 0.8499772313296904
+            },
+            "dot_score": {
+                "accuracy@1": 0.45081967213114754,
+                "accuracy@3": 0.639344262295082,
+                "accuracy@5": 0.6721311475409836,
+                "accuracy@10": 0.8442622950819673,
+                "ndcg@10": 0.6300409997364643,
+                "mrr@10": 0.5643605256310176
+            },
+            "euclidean_distance": {
+                "accuracy@1": 0.7786885245901639,
+                "accuracy@3": 0.8934426229508197,
+                "accuracy@5": 0.9180327868852459,
+                "accuracy@10": 0.9344262295081968,
+                "ndcg@10": 0.8618655596809651,
+                "mrr@10": 0.8380692167577413
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "accuracy@1": 0.7703252032520326,
+                "accuracy@3": 0.8963414634146342,
+                "accuracy@5": 0.9186991869918699,
+                "accuracy@10": 0.9532520325203252,
+                "ndcg@10": 0.8658442146344819,
+                "mrr@10": 0.8374032133178474
+            }
+        }
+    }
+}

results-len512/STS/scores_jsick.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    "metric_name": "spearman",
+    "metric_value": 0.7584805993730833,
+    "details": {
+        "optimal_similarity_metric": "cosine_similarity",
+        "val_scores": {
+            "cosine_similarity": {
+                "pearson": 0.7966088937878548,
+                "spearman": 0.773834909663934
+            },
+            "manhatten_distance": {
+                "pearson": 0.7970989581874747,
+                "spearman": 0.7675081650433571
+            },
+            "euclidean_distance": {
+                "pearson": 0.7970989581874747,
+                "spearman": 0.7675081650433571
+            },
+            "dot_score": {
+                "pearson": 0.6592758306884232,
+                "spearman": 0.6290995800692494
+            }
+        },
+        "test_scores": {
+            "cosine_similarity": {
+                "pearson": 0.7868922847118196,
+                "spearman": 0.7584805993730833
+            }
+        }
+    }
+}

results-len512/STS/scores_jsts.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    "metric_name": "spearman",
+    "metric_value": 0.8379533343977638,
+    "details": {
+        "optimal_similarity_metric": "manhatten_distance",
+        "val_scores": {
+            "cosine_similarity": {
+                "pearson": 0.8437311194400292,
+                "spearman": 0.8061512891309451
+            },
+            "manhatten_distance": {
+                "pearson": 0.8523096056447624,
+                "spearman": 0.8118722694367242
+            },
+            "euclidean_distance": {
+                "pearson": 0.8523096056447624,
+                "spearman": 0.8118722694367242
+            },
+            "dot_score": {
+                "pearson": 0.6225164078211387,
+                "spearman": 0.5546034194858964
+            }
+        },
+        "test_scores": {
+            "manhatten_distance": {
+                "pearson": 0.8750484734396219,
+                "spearman": 0.8379533343977638
+            }
+        }
+    }
+}

results-len512/summary.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "Classification": {
+        "amazon_counterfactual_classification": {
+            "macro_f1": 0.8283702018329007
+        },
+        "amazon_review_classification": {
+            "macro_f1": 0.5918838130358689
+        },
+        "massive_intent_classification": {
+            "macro_f1": 0.7849950487595191
+        },
+        "massive_scenario_classification": {
+            "macro_f1": 0.87335723142719
+        }
+    },
+    "Reranking": {
+        "esci": {
+            "ndcg@10": 0.9327252616959848
+        }
+    },
+    "Retrieval": {
+        "jagovfaqs_22k": {
+            "ndcg@10": 0.7448082812189565
+        },
+        "jaqket": {
+            "ndcg@10": 0.6885528708504698
+        },
+        "mrtydi": {
+            "ndcg@10": 0.4493143159382214
+        },
+        "nlp_journal_abs_intro": {
+            "ndcg@10": 0.9424351024345127
+        },
+        "nlp_journal_title_abs": {
+            "ndcg@10": 0.9717579001048733
+        },
+        "nlp_journal_title_intro": {
+            "ndcg@10": 0.8658442146344819
+        }
+    },
+    "STS": {
+        "jsick": {
+            "spearman": 0.7584805993730833
+        },
+        "jsts": {
+            "spearman": 0.8379533343977638
+        }
+    },
+    "Clustering": {
+        "livedoor_news": {
+            "v_measure_score": 0.5408913333324076
+        },
+        "mewsc16": {
+            "v_measure_score": 0.5028507755536713
+        }
+    },
+    "PairClassification": {
+        "paws_x_ja": {
+            "binary_f1": 0.6175182481751825
+        }
+    }
+}