Add files using upload-large-folder tool
Browse files- config.json +192 -0
- eval_results/eval_mldr.md +19 -0
- eval_results/mldr/baselines/mldr_en_original/eval_summary.json +21 -0
- eval_results/mldr/baselines/mldr_en_original/eval_summary.md +19 -0
- eval_results/mldr/baselines/mldr_ja_original/eval_summary.json +21 -0
- eval_results/mldr/baselines/mldr_ja_original/eval_summary.md +19 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/eval_summary.json +21 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/eval_summary.md +19 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/process_summary.json +17 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1/eval_summary.json +21 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1/eval_summary.md +19 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_2/eval_summary.json +21 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_2/eval_summary.md +19 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_5/eval_summary.json +21 -0
- eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_5/eval_summary.md +19 -0
- eval_results/mldr/en_th_0_05/eval_summary.json +21 -0
- eval_results/mldr/en_th_0_05/eval_summary.md +19 -0
- eval_results/mldr/en_th_0_05/process_summary.json +17 -0
- eval_results/mldr/en_th_0_1/eval_summary.json +21 -0
- eval_results/mldr/en_th_0_1/eval_summary.md +19 -0
- eval_results/mldr/en_th_0_1/process_summary.json +17 -0
- eval_results/mldr/en_th_0_3/eval_summary.json +21 -0
- eval_results/mldr/en_th_0_3/eval_summary.md +19 -0
- eval_results/mldr/en_th_0_3/process_summary.json +17 -0
- eval_results/mldr/en_th_0_5/eval_summary.json +21 -0
- eval_results/mldr/en_th_0_5/eval_summary.md +19 -0
- eval_results/mldr/en_th_0_5/process_summary.json +17 -0
- eval_results/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1.md +17 -0
- eval_results/naver-xprovence-reranker-bgem3-v1_mldr_en_th_0_3.md +17 -0
- model.safetensors +3 -0
- modeling_open_provence_standalone.py +0 -0
- special_tokens_map.json +37 -0
- tokenizer.json +0 -0
- tokenizer_config.json +952 -0
- training_args.json +200 -0
config.json
ADDED
|
@@ -0,0 +1,192 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"OpenProvenceForSequenceClassification"
|
| 4 |
+
],
|
| 5 |
+
"auto_map": {
|
| 6 |
+
"AutoConfig": "modeling_open_provence_standalone.OpenProvenceConfig",
|
| 7 |
+
"AutoModel": "modeling_open_provence_standalone.OpenProvenceForSequenceClassification",
|
| 8 |
+
"AutoModelForSequenceClassification": "modeling_open_provence_standalone.OpenProvenceForSequenceClassification",
|
| 9 |
+
"AutoModelForTokenClassification": "modeling_open_provence_standalone.OpenProvenceForTokenClassification"
|
| 10 |
+
},
|
| 11 |
+
"base_model_config": {
|
| 12 |
+
"_name_or_path": "Alibaba-NLP/gte-reranker-modernbert-base",
|
| 13 |
+
"add_cross_attention": false,
|
| 14 |
+
"architectures": [
|
| 15 |
+
"ModernBertForSequenceClassification"
|
| 16 |
+
],
|
| 17 |
+
"attention_bias": false,
|
| 18 |
+
"attention_dropout": 0.0,
|
| 19 |
+
"bad_words_ids": null,
|
| 20 |
+
"begin_suppress_tokens": null,
|
| 21 |
+
"bos_token_id": 50281,
|
| 22 |
+
"chunk_size_feed_forward": 0,
|
| 23 |
+
"classifier_activation": "gelu",
|
| 24 |
+
"classifier_bias": false,
|
| 25 |
+
"classifier_dropout": 0.0,
|
| 26 |
+
"classifier_pooling": "mean",
|
| 27 |
+
"cls_token_id": 50281,
|
| 28 |
+
"cross_attention_hidden_size": null,
|
| 29 |
+
"decoder_bias": true,
|
| 30 |
+
"decoder_start_token_id": null,
|
| 31 |
+
"deterministic_flash_attn": false,
|
| 32 |
+
"diversity_penalty": 0.0,
|
| 33 |
+
"do_sample": false,
|
| 34 |
+
"dtype": "float32",
|
| 35 |
+
"early_stopping": false,
|
| 36 |
+
"embedding_dropout": 0.0,
|
| 37 |
+
"encoder_no_repeat_ngram_size": 0,
|
| 38 |
+
"eos_token_id": 50282,
|
| 39 |
+
"exponential_decay_length_penalty": null,
|
| 40 |
+
"finetuning_task": null,
|
| 41 |
+
"forced_bos_token_id": null,
|
| 42 |
+
"forced_eos_token_id": null,
|
| 43 |
+
"global_attn_every_n_layers": 3,
|
| 44 |
+
"global_rope_theta": 160000.0,
|
| 45 |
+
"gradient_checkpointing": false,
|
| 46 |
+
"hidden_activation": "gelu",
|
| 47 |
+
"hidden_size": 768,
|
| 48 |
+
"id2label": {
|
| 49 |
+
"0": "LABEL_0"
|
| 50 |
+
},
|
| 51 |
+
"initializer_cutoff_factor": 2.0,
|
| 52 |
+
"initializer_range": 0.02,
|
| 53 |
+
"intermediate_size": 1152,
|
| 54 |
+
"is_decoder": false,
|
| 55 |
+
"is_encoder_decoder": false,
|
| 56 |
+
"label2id": {
|
| 57 |
+
"LABEL_0": 0
|
| 58 |
+
},
|
| 59 |
+
"layer_norm_eps": 1e-05,
|
| 60 |
+
"length_penalty": 1.0,
|
| 61 |
+
"local_attention": 128,
|
| 62 |
+
"local_rope_theta": 10000.0,
|
| 63 |
+
"max_length": 20,
|
| 64 |
+
"max_position_embeddings": 8192,
|
| 65 |
+
"min_length": 0,
|
| 66 |
+
"mlp_bias": false,
|
| 67 |
+
"mlp_dropout": 0.0,
|
| 68 |
+
"model_type": "modernbert",
|
| 69 |
+
"no_repeat_ngram_size": 0,
|
| 70 |
+
"norm_bias": false,
|
| 71 |
+
"norm_eps": 1e-05,
|
| 72 |
+
"num_attention_heads": 12,
|
| 73 |
+
"num_beam_groups": 1,
|
| 74 |
+
"num_beams": 1,
|
| 75 |
+
"num_hidden_layers": 22,
|
| 76 |
+
"num_return_sequences": 1,
|
| 77 |
+
"output_attentions": false,
|
| 78 |
+
"output_hidden_states": false,
|
| 79 |
+
"output_scores": false,
|
| 80 |
+
"pad_token_id": 50283,
|
| 81 |
+
"position_embedding_type": "absolute",
|
| 82 |
+
"prefix": null,
|
| 83 |
+
"problem_type": null,
|
| 84 |
+
"pruned_heads": {},
|
| 85 |
+
"remove_invalid_values": false,
|
| 86 |
+
"repad_logits_with_grad": false,
|
| 87 |
+
"repetition_penalty": 1.0,
|
| 88 |
+
"return_dict": true,
|
| 89 |
+
"return_dict_in_generate": false,
|
| 90 |
+
"sep_token_id": 50282,
|
| 91 |
+
"sparse_pred_ignore_index": -100,
|
| 92 |
+
"sparse_prediction": false,
|
| 93 |
+
"suppress_tokens": null,
|
| 94 |
+
"task_specific_params": null,
|
| 95 |
+
"temperature": 1.0,
|
| 96 |
+
"tf_legacy_loss": false,
|
| 97 |
+
"tie_encoder_decoder": false,
|
| 98 |
+
"tie_word_embeddings": true,
|
| 99 |
+
"tokenizer_class": null,
|
| 100 |
+
"top_k": 50,
|
| 101 |
+
"top_p": 1.0,
|
| 102 |
+
"torchscript": false,
|
| 103 |
+
"transformers_version": "4.57.1",
|
| 104 |
+
"typical_p": 1.0,
|
| 105 |
+
"use_bfloat16": false,
|
| 106 |
+
"vocab_size": 50368
|
| 107 |
+
},
|
| 108 |
+
"base_model_name_or_path": "Alibaba-NLP/gte-reranker-modernbert-base",
|
| 109 |
+
"encoder_architecture": "modernbert",
|
| 110 |
+
"hidden_size": 768,
|
| 111 |
+
"id2label": {
|
| 112 |
+
"0": "LABEL_0"
|
| 113 |
+
},
|
| 114 |
+
"label2id": {
|
| 115 |
+
"LABEL_0": 0
|
| 116 |
+
},
|
| 117 |
+
"max_length": 512,
|
| 118 |
+
"mode": "reranking_pruning",
|
| 119 |
+
"model_type": "open_provence",
|
| 120 |
+
"num_pruning_labels": 2,
|
| 121 |
+
"pruning_config": {
|
| 122 |
+
"_name_or_path": "",
|
| 123 |
+
"add_cross_attention": false,
|
| 124 |
+
"architectures": null,
|
| 125 |
+
"bad_words_ids": null,
|
| 126 |
+
"begin_suppress_tokens": null,
|
| 127 |
+
"bos_token_id": null,
|
| 128 |
+
"chunk_size_feed_forward": 0,
|
| 129 |
+
"classifier_dropout": 0.0,
|
| 130 |
+
"cross_attention_hidden_size": null,
|
| 131 |
+
"decoder_start_token_id": null,
|
| 132 |
+
"diversity_penalty": 0.0,
|
| 133 |
+
"do_sample": false,
|
| 134 |
+
"dtype": null,
|
| 135 |
+
"early_stopping": false,
|
| 136 |
+
"encoder_no_repeat_ngram_size": 0,
|
| 137 |
+
"eos_token_id": null,
|
| 138 |
+
"exponential_decay_length_penalty": null,
|
| 139 |
+
"finetuning_task": null,
|
| 140 |
+
"forced_bos_token_id": null,
|
| 141 |
+
"forced_eos_token_id": null,
|
| 142 |
+
"hidden_size": 768,
|
| 143 |
+
"id2label": {
|
| 144 |
+
"0": "LABEL_0",
|
| 145 |
+
"1": "LABEL_1"
|
| 146 |
+
},
|
| 147 |
+
"is_decoder": false,
|
| 148 |
+
"is_encoder_decoder": false,
|
| 149 |
+
"label2id": {
|
| 150 |
+
"LABEL_0": 0,
|
| 151 |
+
"LABEL_1": 1
|
| 152 |
+
},
|
| 153 |
+
"length_penalty": 1.0,
|
| 154 |
+
"max_length": 20,
|
| 155 |
+
"min_length": 0,
|
| 156 |
+
"model_type": "open_provence_head",
|
| 157 |
+
"no_repeat_ngram_size": 0,
|
| 158 |
+
"num_beam_groups": 1,
|
| 159 |
+
"num_beams": 1,
|
| 160 |
+
"num_return_sequences": 1,
|
| 161 |
+
"output_attentions": false,
|
| 162 |
+
"output_hidden_states": false,
|
| 163 |
+
"output_scores": false,
|
| 164 |
+
"pad_token_id": null,
|
| 165 |
+
"prefix": null,
|
| 166 |
+
"problem_type": null,
|
| 167 |
+
"pruned_heads": {},
|
| 168 |
+
"remove_invalid_values": false,
|
| 169 |
+
"repetition_penalty": 1.0,
|
| 170 |
+
"return_dict": true,
|
| 171 |
+
"return_dict_in_generate": false,
|
| 172 |
+
"sentence_pooling": "mean",
|
| 173 |
+
"sep_token_id": null,
|
| 174 |
+
"suppress_tokens": null,
|
| 175 |
+
"task_specific_params": null,
|
| 176 |
+
"temperature": 1.0,
|
| 177 |
+
"tf_legacy_loss": false,
|
| 178 |
+
"tie_encoder_decoder": false,
|
| 179 |
+
"tie_word_embeddings": true,
|
| 180 |
+
"tokenizer_class": null,
|
| 181 |
+
"top_k": 50,
|
| 182 |
+
"top_p": 1.0,
|
| 183 |
+
"torchscript": false,
|
| 184 |
+
"transformers_version": "4.57.1",
|
| 185 |
+
"typical_p": 1.0,
|
| 186 |
+
"use_bfloat16": false,
|
| 187 |
+
"use_weighted_pooling": false
|
| 188 |
+
},
|
| 189 |
+
"tokenizer_name_or_path": null,
|
| 190 |
+
"transformers_version": "4.57.1",
|
| 191 |
+
"vocab_size": 50368
|
| 192 |
+
}
|
eval_results/eval_mldr.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# MLDR Evaluation Summary — open-provence-reranker-v1
|
| 2 |
+
|
| 3 |
+
## English (en) — refreshed 2025-10-27
|
| 4 |
+
|
| 5 |
+
| Threshold | Has Answer (1) | Has Answer (0) | Failed | Score Mean | Median | Min | Max | Process Time (s) | Eval Time (s) |
|
| 6 |
+
| --- | ---:| ---:| ---:| ---:| ---:| ---:| ---:| ---:| ---:|
|
| 7 |
+
| 0.1 | 164 | 10 | 0 | 0.9354 | 1.0000 | 0.0000 | 1.0000 | 249.06 | 43.89 |
|
| 8 |
+
| 0.2 | 158 | 16 | 0 | 0.9025 | 1.0000 | 0.0000 | 1.0000 | 251.30 | 38.25 |
|
| 9 |
+
| 0.3 | 161 | 13 | 0 | 0.9165 | 1.0000 | 0.0000 | 1.0000 | 260.52 | 34.87 |
|
| 10 |
+
| 0.5 | 152 | 22 | 0 | 0.8645 | 1.0000 | 0.0000 | 1.0000 | 254.43 | 35.69 |
|
| 11 |
+
|
| 12 |
+
### Original Text (no pruning)
|
| 13 |
+
|
| 14 |
+
- Has Answer (1): 163
|
| 15 |
+
- Has Answer (0): 11
|
| 16 |
+
- Failed: 0
|
| 17 |
+
- Answer score mean/median/min/max: 0.9328 / 1.0000 / 0.0000 / 1.0000
|
| 18 |
+
- Process time (s): 4.27
|
| 19 |
+
- LLM eval time (s): 227.76
|
eval_results/mldr/baselines/mldr_en_original/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/mldr_en_original/process_original/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 163,
|
| 10 |
+
"has_answer_0": 11,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.9281034482758621,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 3.4119314670097083,
|
| 20 |
+
"evaluation_time_seconds": 98.81951962405583
|
| 21 |
+
}
|
eval_results/mldr/baselines/mldr_en_original/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/mldr_en_original/process_original/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 163
|
| 10 |
+
- Has answer (0): 11
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 3.41
|
| 13 |
+
- LLM eval time (s): 98.82
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.9281
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/baselines/mldr_ja_original/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-japanese-v1/mldr_ja_original/process_original/dataset",
|
| 3 |
+
"language": "jp",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 166,
|
| 7 |
+
"ignored_count": 272,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 129,
|
| 10 |
+
"has_answer_0": 37,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.734578313253012,
|
| 15 |
+
"median": 0.9,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 2.720734969014302,
|
| 20 |
+
"evaluation_time_seconds": 169.58438874501735
|
| 21 |
+
}
|
eval_results/mldr/baselines/mldr_ja_original/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-japanese-v1/mldr_ja_original/process_original/dataset`
|
| 4 |
+
- Language: jp
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 166
|
| 8 |
+
- Ignored queries: 272
|
| 9 |
+
- Has answer (1): 129
|
| 10 |
+
- Has answer (0): 37
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 2.72
|
| 13 |
+
- LLM eval time (s): 169.58
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.7346
|
| 17 |
+
- median: 0.9000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/run1/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 162,
|
| 10 |
+
"has_answer_0": 12,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.9173563218390804,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 380.79417042899877,
|
| 20 |
+
"evaluation_time_seconds": 29.97553447500104
|
| 21 |
+
}
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/run1/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 162
|
| 10 |
+
- Has answer (0): 12
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 380.79
|
| 13 |
+
- LLM eval time (s): 29.98
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.9174
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_05/process_summary.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"limit": 200,
|
| 3 |
+
"threshold": 0.05,
|
| 4 |
+
"num_records": 1600,
|
| 5 |
+
"num_queries": 200,
|
| 6 |
+
"dataset_language": "en",
|
| 7 |
+
"splitter_language": "en",
|
| 8 |
+
"max_length": null,
|
| 9 |
+
"model": "naver/provence-reranker-debertav3-v1",
|
| 10 |
+
"naver_provence_model": true,
|
| 11 |
+
"avg_pos_score": -6.5308984375,
|
| 12 |
+
"avg_neg_score": -10.574609375,
|
| 13 |
+
"avg_pos_compression": 92.10123209994308,
|
| 14 |
+
"avg_neg_compression": 99.15497159939561,
|
| 15 |
+
"source_text": "pruned",
|
| 16 |
+
"process_time_seconds": 380.79417042899877
|
| 17 |
+
}
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 162,
|
| 10 |
+
"has_answer_0": 12,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.9153448275862069,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 389.7323627329897,
|
| 20 |
+
"evaluation_time_seconds": 190.08830377610866
|
| 21 |
+
}
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 162
|
| 10 |
+
- Has answer (0): 12
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 389.73
|
| 13 |
+
- LLM eval time (s): 190.09
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.9153
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_2/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_2/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 157,
|
| 10 |
+
"has_answer_0": 17,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.8882758620689656,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 392.35378917702474,
|
| 20 |
+
"evaluation_time_seconds": 187.29701190802734
|
| 21 |
+
}
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_2/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_2/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 157
|
| 10 |
+
- Has answer (0): 17
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 392.35
|
| 13 |
+
- LLM eval time (s): 187.30
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.8883
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_5/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_5/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 147,
|
| 10 |
+
"has_answer_0": 27,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.8420114942528735,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 391.33639042195864,
|
| 20 |
+
"evaluation_time_seconds": 181.43732876703143
|
| 21 |
+
}
|
eval_results/mldr/baselines/naver-provence-reranker-debertav3-v1_mldr_en_th_0_5/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/naver-provence-reranker-eval/naver-provence-reranker-debertav3-v1_mldr_en_th_0_5/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 147
|
| 10 |
+
- Has answer (0): 27
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 391.34
|
| 13 |
+
- LLM eval time (s): 181.44
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.8420
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/en_th_0_05/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_05_attempt1/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 164,
|
| 10 |
+
"has_answer_0": 10,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.9278735632183908,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 261.30367420602124,
|
| 20 |
+
"evaluation_time_seconds": 29.534542897017673
|
| 21 |
+
}
|
eval_results/mldr/en_th_0_05/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_05_attempt1/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 164
|
| 10 |
+
- Has answer (0): 10
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 261.30
|
| 13 |
+
- LLM eval time (s): 29.53
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.9279
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/en_th_0_05/process_summary.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"limit": 200,
|
| 3 |
+
"threshold": 0.05,
|
| 4 |
+
"num_records": 1600,
|
| 5 |
+
"num_queries": 200,
|
| 6 |
+
"dataset_language": "en",
|
| 7 |
+
"splitter_language": "auto",
|
| 8 |
+
"max_length": null,
|
| 9 |
+
"model": "output/release_models/open-provence-reranker-v1",
|
| 10 |
+
"naver_provence_model": false,
|
| 11 |
+
"avg_pos_score": 0.7220386701822281,
|
| 12 |
+
"avg_neg_score": 0.16591052538582257,
|
| 13 |
+
"avg_pos_compression": 86.67305848274736,
|
| 14 |
+
"avg_neg_compression": 99.71228029348991,
|
| 15 |
+
"source_text": "pruned",
|
| 16 |
+
"process_time_seconds": 261.30367420602124
|
| 17 |
+
}
|
eval_results/mldr/en_th_0_1/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_1_attempt1/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 164,
|
| 10 |
+
"has_answer_0": 10,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.9351149425287357,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 260.8915817589732,
|
| 20 |
+
"evaluation_time_seconds": 31.940818482078612
|
| 21 |
+
}
|
eval_results/mldr/en_th_0_1/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_1_attempt1/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 164
|
| 10 |
+
- Has answer (0): 10
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 260.89
|
| 13 |
+
- LLM eval time (s): 31.94
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.9351
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/en_th_0_1/process_summary.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"limit": 200,
|
| 3 |
+
"threshold": 0.1,
|
| 4 |
+
"num_records": 1600,
|
| 5 |
+
"num_queries": 200,
|
| 6 |
+
"dataset_language": "en",
|
| 7 |
+
"splitter_language": "auto",
|
| 8 |
+
"max_length": null,
|
| 9 |
+
"model": "output/release_models/open-provence-reranker-v1",
|
| 10 |
+
"naver_provence_model": false,
|
| 11 |
+
"avg_pos_score": 0.7186262372136116,
|
| 12 |
+
"avg_neg_score": 0.10100883937307767,
|
| 13 |
+
"avg_pos_compression": 92.32767405509574,
|
| 14 |
+
"avg_neg_compression": 99.91221173248853,
|
| 15 |
+
"source_text": "pruned",
|
| 16 |
+
"process_time_seconds": 260.8915817589732
|
| 17 |
+
}
|
eval_results/mldr/en_th_0_3/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_3_attempt1/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 157,
|
| 10 |
+
"has_answer_0": 17,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.8953448275862068,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 261.1759908599779,
|
| 20 |
+
"evaluation_time_seconds": 27.776169850025326
|
| 21 |
+
}
|
eval_results/mldr/en_th_0_3/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_3_attempt1/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 157
|
| 10 |
+
- Has answer (0): 17
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 261.18
|
| 13 |
+
- LLM eval time (s): 27.78
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.8953
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/en_th_0_3/process_summary.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"limit": 200,
|
| 3 |
+
"threshold": 0.3,
|
| 4 |
+
"num_records": 1600,
|
| 5 |
+
"num_queries": 200,
|
| 6 |
+
"dataset_language": "en",
|
| 7 |
+
"splitter_language": "auto",
|
| 8 |
+
"max_length": null,
|
| 9 |
+
"model": "output/release_models/open-provence-reranker-v1",
|
| 10 |
+
"naver_provence_model": false,
|
| 11 |
+
"avg_pos_score": 0.715216779410839,
|
| 12 |
+
"avg_neg_score": 0.02076476133295468,
|
| 13 |
+
"avg_pos_compression": 96.97861135663942,
|
| 14 |
+
"avg_neg_compression": 99.993944709442,
|
| 15 |
+
"source_text": "pruned",
|
| 16 |
+
"process_time_seconds": 261.1759908599779
|
| 17 |
+
}
|
eval_results/mldr/en_th_0_5/eval_summary.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"input_dataset": "/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_5_attempt1/process/dataset",
|
| 3 |
+
"language": "en",
|
| 4 |
+
"llm_model": "gpt-5-nano",
|
| 5 |
+
"reasoning_effort": "low",
|
| 6 |
+
"records_evaluated": 174,
|
| 7 |
+
"ignored_count": 208,
|
| 8 |
+
"counts": {
|
| 9 |
+
"has_answer_1": 152,
|
| 10 |
+
"has_answer_0": 22,
|
| 11 |
+
"failed": 0
|
| 12 |
+
},
|
| 13 |
+
"answer_score_stats": {
|
| 14 |
+
"mean": 0.8660919540229884,
|
| 15 |
+
"median": 1.0,
|
| 16 |
+
"min": 0.0,
|
| 17 |
+
"max": 1.0
|
| 18 |
+
},
|
| 19 |
+
"process_time_seconds": 261.31356202194,
|
| 20 |
+
"evaluation_time_seconds": 25.42166205099784
|
| 21 |
+
}
|
eval_results/mldr/en_th_0_5/eval_summary.md
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/open-provence-reranker-v1/en_th_0_5_attempt1/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-nano
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 152
|
| 10 |
+
- Has answer (0): 22
|
| 11 |
+
- Failed: 0
|
| 12 |
+
- Process time (s): 261.31
|
| 13 |
+
- LLM eval time (s): 25.42
|
| 14 |
+
|
| 15 |
+
## Answer Score Statistics
|
| 16 |
+
- mean: 0.8661
|
| 17 |
+
- median: 1.0000
|
| 18 |
+
- min: 0.0000
|
| 19 |
+
- max: 1.0000
|
eval_results/mldr/en_th_0_5/process_summary.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"limit": 200,
|
| 3 |
+
"threshold": 0.5,
|
| 4 |
+
"num_records": 1600,
|
| 5 |
+
"num_queries": 200,
|
| 6 |
+
"dataset_language": "en",
|
| 7 |
+
"splitter_language": "auto",
|
| 8 |
+
"max_length": null,
|
| 9 |
+
"model": "output/release_models/open-provence-reranker-v1",
|
| 10 |
+
"naver_provence_model": false,
|
| 11 |
+
"avg_pos_score": 0.6940265846252441,
|
| 12 |
+
"avg_neg_score": 0.006882384909050805,
|
| 13 |
+
"avg_pos_compression": 98.24189101722801,
|
| 14 |
+
"avg_neg_compression": 99.99934651299124,
|
| 15 |
+
"source_text": "pruned",
|
| 16 |
+
"process_time_seconds": 261.31356202194
|
| 17 |
+
}
|
eval_results/naver-provence-reranker-debertav3-v1_mldr_en_th_0_1.md
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/naver-provence-reranker-debertav3-v1/mldr_en_th_0_1/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-mini
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 159
|
| 10 |
+
- Has answer (0): 15
|
| 11 |
+
- Failed: 0
|
| 12 |
+
|
| 13 |
+
## Answer Score Statistics
|
| 14 |
+
- mean: 0.9115
|
| 15 |
+
- median: 1.0000
|
| 16 |
+
- min: 0.0000
|
| 17 |
+
- max: 1.0000
|
eval_results/naver-xprovence-reranker-bgem3-v1_mldr_en_th_0_3.md
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# LLM Evaluation Summary
|
| 2 |
+
|
| 3 |
+
- Dataset: `/home/hotchpotch/src/github.com/hotchpotch/open_provence/tmp/mldr_runs/naver-xprovence-reranker-bgem3-v1/mldr_en_th_0_3/process/dataset`
|
| 4 |
+
- Language: en
|
| 5 |
+
- LLM model: gpt-5-mini
|
| 6 |
+
- Reasoning effort: low
|
| 7 |
+
- Records evaluated: 174
|
| 8 |
+
- Ignored queries: 208
|
| 9 |
+
- Has answer (1): 74
|
| 10 |
+
- Has answer (0): 100
|
| 11 |
+
- Failed: 0
|
| 12 |
+
|
| 13 |
+
## Answer Score Statistics
|
| 14 |
+
- mean: 0.4306
|
| 15 |
+
- median: 0.0500
|
| 16 |
+
- min: 0.0000
|
| 17 |
+
- max: 1.0000
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5eaba6f11f47c1d595b837d617effcbfe72b6a4adc9ce8fce58d1b59baabe4e6
|
| 3 |
+
size 598444940
|
modeling_open_provence_standalone.py
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": true,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,952 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "|||IP_ADDRESS|||",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": true,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": false
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<|padding|>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"50254": {
|
| 20 |
+
"content": " ",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": true,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": false
|
| 26 |
+
},
|
| 27 |
+
"50255": {
|
| 28 |
+
"content": " ",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": true,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": false
|
| 34 |
+
},
|
| 35 |
+
"50256": {
|
| 36 |
+
"content": " ",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": true,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": false
|
| 42 |
+
},
|
| 43 |
+
"50257": {
|
| 44 |
+
"content": " ",
|
| 45 |
+
"lstrip": false,
|
| 46 |
+
"normalized": true,
|
| 47 |
+
"rstrip": false,
|
| 48 |
+
"single_word": false,
|
| 49 |
+
"special": false
|
| 50 |
+
},
|
| 51 |
+
"50258": {
|
| 52 |
+
"content": " ",
|
| 53 |
+
"lstrip": false,
|
| 54 |
+
"normalized": true,
|
| 55 |
+
"rstrip": false,
|
| 56 |
+
"single_word": false,
|
| 57 |
+
"special": false
|
| 58 |
+
},
|
| 59 |
+
"50259": {
|
| 60 |
+
"content": " ",
|
| 61 |
+
"lstrip": false,
|
| 62 |
+
"normalized": true,
|
| 63 |
+
"rstrip": false,
|
| 64 |
+
"single_word": false,
|
| 65 |
+
"special": false
|
| 66 |
+
},
|
| 67 |
+
"50260": {
|
| 68 |
+
"content": " ",
|
| 69 |
+
"lstrip": false,
|
| 70 |
+
"normalized": true,
|
| 71 |
+
"rstrip": false,
|
| 72 |
+
"single_word": false,
|
| 73 |
+
"special": false
|
| 74 |
+
},
|
| 75 |
+
"50261": {
|
| 76 |
+
"content": " ",
|
| 77 |
+
"lstrip": false,
|
| 78 |
+
"normalized": true,
|
| 79 |
+
"rstrip": false,
|
| 80 |
+
"single_word": false,
|
| 81 |
+
"special": false
|
| 82 |
+
},
|
| 83 |
+
"50262": {
|
| 84 |
+
"content": " ",
|
| 85 |
+
"lstrip": false,
|
| 86 |
+
"normalized": true,
|
| 87 |
+
"rstrip": false,
|
| 88 |
+
"single_word": false,
|
| 89 |
+
"special": false
|
| 90 |
+
},
|
| 91 |
+
"50263": {
|
| 92 |
+
"content": " ",
|
| 93 |
+
"lstrip": false,
|
| 94 |
+
"normalized": true,
|
| 95 |
+
"rstrip": false,
|
| 96 |
+
"single_word": false,
|
| 97 |
+
"special": false
|
| 98 |
+
},
|
| 99 |
+
"50264": {
|
| 100 |
+
"content": " ",
|
| 101 |
+
"lstrip": false,
|
| 102 |
+
"normalized": true,
|
| 103 |
+
"rstrip": false,
|
| 104 |
+
"single_word": false,
|
| 105 |
+
"special": false
|
| 106 |
+
},
|
| 107 |
+
"50265": {
|
| 108 |
+
"content": " ",
|
| 109 |
+
"lstrip": false,
|
| 110 |
+
"normalized": true,
|
| 111 |
+
"rstrip": false,
|
| 112 |
+
"single_word": false,
|
| 113 |
+
"special": false
|
| 114 |
+
},
|
| 115 |
+
"50266": {
|
| 116 |
+
"content": " ",
|
| 117 |
+
"lstrip": false,
|
| 118 |
+
"normalized": true,
|
| 119 |
+
"rstrip": false,
|
| 120 |
+
"single_word": false,
|
| 121 |
+
"special": false
|
| 122 |
+
},
|
| 123 |
+
"50267": {
|
| 124 |
+
"content": " ",
|
| 125 |
+
"lstrip": false,
|
| 126 |
+
"normalized": true,
|
| 127 |
+
"rstrip": false,
|
| 128 |
+
"single_word": false,
|
| 129 |
+
"special": false
|
| 130 |
+
},
|
| 131 |
+
"50268": {
|
| 132 |
+
"content": " ",
|
| 133 |
+
"lstrip": false,
|
| 134 |
+
"normalized": true,
|
| 135 |
+
"rstrip": false,
|
| 136 |
+
"single_word": false,
|
| 137 |
+
"special": false
|
| 138 |
+
},
|
| 139 |
+
"50269": {
|
| 140 |
+
"content": " ",
|
| 141 |
+
"lstrip": false,
|
| 142 |
+
"normalized": true,
|
| 143 |
+
"rstrip": false,
|
| 144 |
+
"single_word": false,
|
| 145 |
+
"special": false
|
| 146 |
+
},
|
| 147 |
+
"50270": {
|
| 148 |
+
"content": " ",
|
| 149 |
+
"lstrip": false,
|
| 150 |
+
"normalized": true,
|
| 151 |
+
"rstrip": false,
|
| 152 |
+
"single_word": false,
|
| 153 |
+
"special": false
|
| 154 |
+
},
|
| 155 |
+
"50271": {
|
| 156 |
+
"content": " ",
|
| 157 |
+
"lstrip": false,
|
| 158 |
+
"normalized": true,
|
| 159 |
+
"rstrip": false,
|
| 160 |
+
"single_word": false,
|
| 161 |
+
"special": false
|
| 162 |
+
},
|
| 163 |
+
"50272": {
|
| 164 |
+
"content": " ",
|
| 165 |
+
"lstrip": false,
|
| 166 |
+
"normalized": true,
|
| 167 |
+
"rstrip": false,
|
| 168 |
+
"single_word": false,
|
| 169 |
+
"special": false
|
| 170 |
+
},
|
| 171 |
+
"50273": {
|
| 172 |
+
"content": " ",
|
| 173 |
+
"lstrip": false,
|
| 174 |
+
"normalized": true,
|
| 175 |
+
"rstrip": false,
|
| 176 |
+
"single_word": false,
|
| 177 |
+
"special": false
|
| 178 |
+
},
|
| 179 |
+
"50274": {
|
| 180 |
+
"content": " ",
|
| 181 |
+
"lstrip": false,
|
| 182 |
+
"normalized": true,
|
| 183 |
+
"rstrip": false,
|
| 184 |
+
"single_word": false,
|
| 185 |
+
"special": false
|
| 186 |
+
},
|
| 187 |
+
"50275": {
|
| 188 |
+
"content": " ",
|
| 189 |
+
"lstrip": false,
|
| 190 |
+
"normalized": true,
|
| 191 |
+
"rstrip": false,
|
| 192 |
+
"single_word": false,
|
| 193 |
+
"special": false
|
| 194 |
+
},
|
| 195 |
+
"50276": {
|
| 196 |
+
"content": " ",
|
| 197 |
+
"lstrip": false,
|
| 198 |
+
"normalized": true,
|
| 199 |
+
"rstrip": false,
|
| 200 |
+
"single_word": false,
|
| 201 |
+
"special": false
|
| 202 |
+
},
|
| 203 |
+
"50277": {
|
| 204 |
+
"content": "|||EMAIL_ADDRESS|||",
|
| 205 |
+
"lstrip": false,
|
| 206 |
+
"normalized": true,
|
| 207 |
+
"rstrip": false,
|
| 208 |
+
"single_word": false,
|
| 209 |
+
"special": false
|
| 210 |
+
},
|
| 211 |
+
"50278": {
|
| 212 |
+
"content": "|||PHONE_NUMBER|||",
|
| 213 |
+
"lstrip": false,
|
| 214 |
+
"normalized": true,
|
| 215 |
+
"rstrip": false,
|
| 216 |
+
"single_word": false,
|
| 217 |
+
"special": false
|
| 218 |
+
},
|
| 219 |
+
"50279": {
|
| 220 |
+
"content": "<|endoftext|>",
|
| 221 |
+
"lstrip": false,
|
| 222 |
+
"normalized": false,
|
| 223 |
+
"rstrip": false,
|
| 224 |
+
"single_word": false,
|
| 225 |
+
"special": true
|
| 226 |
+
},
|
| 227 |
+
"50280": {
|
| 228 |
+
"content": "[UNK]",
|
| 229 |
+
"lstrip": false,
|
| 230 |
+
"normalized": false,
|
| 231 |
+
"rstrip": false,
|
| 232 |
+
"single_word": false,
|
| 233 |
+
"special": true
|
| 234 |
+
},
|
| 235 |
+
"50281": {
|
| 236 |
+
"content": "[CLS]",
|
| 237 |
+
"lstrip": false,
|
| 238 |
+
"normalized": false,
|
| 239 |
+
"rstrip": false,
|
| 240 |
+
"single_word": false,
|
| 241 |
+
"special": true
|
| 242 |
+
},
|
| 243 |
+
"50282": {
|
| 244 |
+
"content": "[SEP]",
|
| 245 |
+
"lstrip": false,
|
| 246 |
+
"normalized": false,
|
| 247 |
+
"rstrip": false,
|
| 248 |
+
"single_word": false,
|
| 249 |
+
"special": true
|
| 250 |
+
},
|
| 251 |
+
"50283": {
|
| 252 |
+
"content": "[PAD]",
|
| 253 |
+
"lstrip": false,
|
| 254 |
+
"normalized": false,
|
| 255 |
+
"rstrip": false,
|
| 256 |
+
"single_word": false,
|
| 257 |
+
"special": true
|
| 258 |
+
},
|
| 259 |
+
"50284": {
|
| 260 |
+
"content": "[MASK]",
|
| 261 |
+
"lstrip": true,
|
| 262 |
+
"normalized": false,
|
| 263 |
+
"rstrip": false,
|
| 264 |
+
"single_word": false,
|
| 265 |
+
"special": true
|
| 266 |
+
},
|
| 267 |
+
"50285": {
|
| 268 |
+
"content": "[unused0]",
|
| 269 |
+
"lstrip": false,
|
| 270 |
+
"normalized": true,
|
| 271 |
+
"rstrip": false,
|
| 272 |
+
"single_word": false,
|
| 273 |
+
"special": false
|
| 274 |
+
},
|
| 275 |
+
"50286": {
|
| 276 |
+
"content": "[unused1]",
|
| 277 |
+
"lstrip": false,
|
| 278 |
+
"normalized": true,
|
| 279 |
+
"rstrip": false,
|
| 280 |
+
"single_word": false,
|
| 281 |
+
"special": false
|
| 282 |
+
},
|
| 283 |
+
"50287": {
|
| 284 |
+
"content": "[unused2]",
|
| 285 |
+
"lstrip": false,
|
| 286 |
+
"normalized": true,
|
| 287 |
+
"rstrip": false,
|
| 288 |
+
"single_word": false,
|
| 289 |
+
"special": false
|
| 290 |
+
},
|
| 291 |
+
"50288": {
|
| 292 |
+
"content": "[unused3]",
|
| 293 |
+
"lstrip": false,
|
| 294 |
+
"normalized": true,
|
| 295 |
+
"rstrip": false,
|
| 296 |
+
"single_word": false,
|
| 297 |
+
"special": false
|
| 298 |
+
},
|
| 299 |
+
"50289": {
|
| 300 |
+
"content": "[unused4]",
|
| 301 |
+
"lstrip": false,
|
| 302 |
+
"normalized": true,
|
| 303 |
+
"rstrip": false,
|
| 304 |
+
"single_word": false,
|
| 305 |
+
"special": false
|
| 306 |
+
},
|
| 307 |
+
"50290": {
|
| 308 |
+
"content": "[unused5]",
|
| 309 |
+
"lstrip": false,
|
| 310 |
+
"normalized": true,
|
| 311 |
+
"rstrip": false,
|
| 312 |
+
"single_word": false,
|
| 313 |
+
"special": false
|
| 314 |
+
},
|
| 315 |
+
"50291": {
|
| 316 |
+
"content": "[unused6]",
|
| 317 |
+
"lstrip": false,
|
| 318 |
+
"normalized": true,
|
| 319 |
+
"rstrip": false,
|
| 320 |
+
"single_word": false,
|
| 321 |
+
"special": false
|
| 322 |
+
},
|
| 323 |
+
"50292": {
|
| 324 |
+
"content": "[unused7]",
|
| 325 |
+
"lstrip": false,
|
| 326 |
+
"normalized": true,
|
| 327 |
+
"rstrip": false,
|
| 328 |
+
"single_word": false,
|
| 329 |
+
"special": false
|
| 330 |
+
},
|
| 331 |
+
"50293": {
|
| 332 |
+
"content": "[unused8]",
|
| 333 |
+
"lstrip": false,
|
| 334 |
+
"normalized": true,
|
| 335 |
+
"rstrip": false,
|
| 336 |
+
"single_word": false,
|
| 337 |
+
"special": false
|
| 338 |
+
},
|
| 339 |
+
"50294": {
|
| 340 |
+
"content": "[unused9]",
|
| 341 |
+
"lstrip": false,
|
| 342 |
+
"normalized": true,
|
| 343 |
+
"rstrip": false,
|
| 344 |
+
"single_word": false,
|
| 345 |
+
"special": false
|
| 346 |
+
},
|
| 347 |
+
"50295": {
|
| 348 |
+
"content": "[unused10]",
|
| 349 |
+
"lstrip": false,
|
| 350 |
+
"normalized": true,
|
| 351 |
+
"rstrip": false,
|
| 352 |
+
"single_word": false,
|
| 353 |
+
"special": false
|
| 354 |
+
},
|
| 355 |
+
"50296": {
|
| 356 |
+
"content": "[unused11]",
|
| 357 |
+
"lstrip": false,
|
| 358 |
+
"normalized": true,
|
| 359 |
+
"rstrip": false,
|
| 360 |
+
"single_word": false,
|
| 361 |
+
"special": false
|
| 362 |
+
},
|
| 363 |
+
"50297": {
|
| 364 |
+
"content": "[unused12]",
|
| 365 |
+
"lstrip": false,
|
| 366 |
+
"normalized": true,
|
| 367 |
+
"rstrip": false,
|
| 368 |
+
"single_word": false,
|
| 369 |
+
"special": false
|
| 370 |
+
},
|
| 371 |
+
"50298": {
|
| 372 |
+
"content": "[unused13]",
|
| 373 |
+
"lstrip": false,
|
| 374 |
+
"normalized": true,
|
| 375 |
+
"rstrip": false,
|
| 376 |
+
"single_word": false,
|
| 377 |
+
"special": false
|
| 378 |
+
},
|
| 379 |
+
"50299": {
|
| 380 |
+
"content": "[unused14]",
|
| 381 |
+
"lstrip": false,
|
| 382 |
+
"normalized": true,
|
| 383 |
+
"rstrip": false,
|
| 384 |
+
"single_word": false,
|
| 385 |
+
"special": false
|
| 386 |
+
},
|
| 387 |
+
"50300": {
|
| 388 |
+
"content": "[unused15]",
|
| 389 |
+
"lstrip": false,
|
| 390 |
+
"normalized": true,
|
| 391 |
+
"rstrip": false,
|
| 392 |
+
"single_word": false,
|
| 393 |
+
"special": false
|
| 394 |
+
},
|
| 395 |
+
"50301": {
|
| 396 |
+
"content": "[unused16]",
|
| 397 |
+
"lstrip": false,
|
| 398 |
+
"normalized": true,
|
| 399 |
+
"rstrip": false,
|
| 400 |
+
"single_word": false,
|
| 401 |
+
"special": false
|
| 402 |
+
},
|
| 403 |
+
"50302": {
|
| 404 |
+
"content": "[unused17]",
|
| 405 |
+
"lstrip": false,
|
| 406 |
+
"normalized": true,
|
| 407 |
+
"rstrip": false,
|
| 408 |
+
"single_word": false,
|
| 409 |
+
"special": false
|
| 410 |
+
},
|
| 411 |
+
"50303": {
|
| 412 |
+
"content": "[unused18]",
|
| 413 |
+
"lstrip": false,
|
| 414 |
+
"normalized": true,
|
| 415 |
+
"rstrip": false,
|
| 416 |
+
"single_word": false,
|
| 417 |
+
"special": false
|
| 418 |
+
},
|
| 419 |
+
"50304": {
|
| 420 |
+
"content": "[unused19]",
|
| 421 |
+
"lstrip": false,
|
| 422 |
+
"normalized": true,
|
| 423 |
+
"rstrip": false,
|
| 424 |
+
"single_word": false,
|
| 425 |
+
"special": false
|
| 426 |
+
},
|
| 427 |
+
"50305": {
|
| 428 |
+
"content": "[unused20]",
|
| 429 |
+
"lstrip": false,
|
| 430 |
+
"normalized": true,
|
| 431 |
+
"rstrip": false,
|
| 432 |
+
"single_word": false,
|
| 433 |
+
"special": false
|
| 434 |
+
},
|
| 435 |
+
"50306": {
|
| 436 |
+
"content": "[unused21]",
|
| 437 |
+
"lstrip": false,
|
| 438 |
+
"normalized": true,
|
| 439 |
+
"rstrip": false,
|
| 440 |
+
"single_word": false,
|
| 441 |
+
"special": false
|
| 442 |
+
},
|
| 443 |
+
"50307": {
|
| 444 |
+
"content": "[unused22]",
|
| 445 |
+
"lstrip": false,
|
| 446 |
+
"normalized": true,
|
| 447 |
+
"rstrip": false,
|
| 448 |
+
"single_word": false,
|
| 449 |
+
"special": false
|
| 450 |
+
},
|
| 451 |
+
"50308": {
|
| 452 |
+
"content": "[unused23]",
|
| 453 |
+
"lstrip": false,
|
| 454 |
+
"normalized": true,
|
| 455 |
+
"rstrip": false,
|
| 456 |
+
"single_word": false,
|
| 457 |
+
"special": false
|
| 458 |
+
},
|
| 459 |
+
"50309": {
|
| 460 |
+
"content": "[unused24]",
|
| 461 |
+
"lstrip": false,
|
| 462 |
+
"normalized": true,
|
| 463 |
+
"rstrip": false,
|
| 464 |
+
"single_word": false,
|
| 465 |
+
"special": false
|
| 466 |
+
},
|
| 467 |
+
"50310": {
|
| 468 |
+
"content": "[unused25]",
|
| 469 |
+
"lstrip": false,
|
| 470 |
+
"normalized": true,
|
| 471 |
+
"rstrip": false,
|
| 472 |
+
"single_word": false,
|
| 473 |
+
"special": false
|
| 474 |
+
},
|
| 475 |
+
"50311": {
|
| 476 |
+
"content": "[unused26]",
|
| 477 |
+
"lstrip": false,
|
| 478 |
+
"normalized": true,
|
| 479 |
+
"rstrip": false,
|
| 480 |
+
"single_word": false,
|
| 481 |
+
"special": false
|
| 482 |
+
},
|
| 483 |
+
"50312": {
|
| 484 |
+
"content": "[unused27]",
|
| 485 |
+
"lstrip": false,
|
| 486 |
+
"normalized": true,
|
| 487 |
+
"rstrip": false,
|
| 488 |
+
"single_word": false,
|
| 489 |
+
"special": false
|
| 490 |
+
},
|
| 491 |
+
"50313": {
|
| 492 |
+
"content": "[unused28]",
|
| 493 |
+
"lstrip": false,
|
| 494 |
+
"normalized": true,
|
| 495 |
+
"rstrip": false,
|
| 496 |
+
"single_word": false,
|
| 497 |
+
"special": false
|
| 498 |
+
},
|
| 499 |
+
"50314": {
|
| 500 |
+
"content": "[unused29]",
|
| 501 |
+
"lstrip": false,
|
| 502 |
+
"normalized": true,
|
| 503 |
+
"rstrip": false,
|
| 504 |
+
"single_word": false,
|
| 505 |
+
"special": false
|
| 506 |
+
},
|
| 507 |
+
"50315": {
|
| 508 |
+
"content": "[unused30]",
|
| 509 |
+
"lstrip": false,
|
| 510 |
+
"normalized": true,
|
| 511 |
+
"rstrip": false,
|
| 512 |
+
"single_word": false,
|
| 513 |
+
"special": false
|
| 514 |
+
},
|
| 515 |
+
"50316": {
|
| 516 |
+
"content": "[unused31]",
|
| 517 |
+
"lstrip": false,
|
| 518 |
+
"normalized": true,
|
| 519 |
+
"rstrip": false,
|
| 520 |
+
"single_word": false,
|
| 521 |
+
"special": false
|
| 522 |
+
},
|
| 523 |
+
"50317": {
|
| 524 |
+
"content": "[unused32]",
|
| 525 |
+
"lstrip": false,
|
| 526 |
+
"normalized": true,
|
| 527 |
+
"rstrip": false,
|
| 528 |
+
"single_word": false,
|
| 529 |
+
"special": false
|
| 530 |
+
},
|
| 531 |
+
"50318": {
|
| 532 |
+
"content": "[unused33]",
|
| 533 |
+
"lstrip": false,
|
| 534 |
+
"normalized": true,
|
| 535 |
+
"rstrip": false,
|
| 536 |
+
"single_word": false,
|
| 537 |
+
"special": false
|
| 538 |
+
},
|
| 539 |
+
"50319": {
|
| 540 |
+
"content": "[unused34]",
|
| 541 |
+
"lstrip": false,
|
| 542 |
+
"normalized": true,
|
| 543 |
+
"rstrip": false,
|
| 544 |
+
"single_word": false,
|
| 545 |
+
"special": false
|
| 546 |
+
},
|
| 547 |
+
"50320": {
|
| 548 |
+
"content": "[unused35]",
|
| 549 |
+
"lstrip": false,
|
| 550 |
+
"normalized": true,
|
| 551 |
+
"rstrip": false,
|
| 552 |
+
"single_word": false,
|
| 553 |
+
"special": false
|
| 554 |
+
},
|
| 555 |
+
"50321": {
|
| 556 |
+
"content": "[unused36]",
|
| 557 |
+
"lstrip": false,
|
| 558 |
+
"normalized": true,
|
| 559 |
+
"rstrip": false,
|
| 560 |
+
"single_word": false,
|
| 561 |
+
"special": false
|
| 562 |
+
},
|
| 563 |
+
"50322": {
|
| 564 |
+
"content": "[unused37]",
|
| 565 |
+
"lstrip": false,
|
| 566 |
+
"normalized": true,
|
| 567 |
+
"rstrip": false,
|
| 568 |
+
"single_word": false,
|
| 569 |
+
"special": false
|
| 570 |
+
},
|
| 571 |
+
"50323": {
|
| 572 |
+
"content": "[unused38]",
|
| 573 |
+
"lstrip": false,
|
| 574 |
+
"normalized": true,
|
| 575 |
+
"rstrip": false,
|
| 576 |
+
"single_word": false,
|
| 577 |
+
"special": false
|
| 578 |
+
},
|
| 579 |
+
"50324": {
|
| 580 |
+
"content": "[unused39]",
|
| 581 |
+
"lstrip": false,
|
| 582 |
+
"normalized": true,
|
| 583 |
+
"rstrip": false,
|
| 584 |
+
"single_word": false,
|
| 585 |
+
"special": false
|
| 586 |
+
},
|
| 587 |
+
"50325": {
|
| 588 |
+
"content": "[unused40]",
|
| 589 |
+
"lstrip": false,
|
| 590 |
+
"normalized": true,
|
| 591 |
+
"rstrip": false,
|
| 592 |
+
"single_word": false,
|
| 593 |
+
"special": false
|
| 594 |
+
},
|
| 595 |
+
"50326": {
|
| 596 |
+
"content": "[unused41]",
|
| 597 |
+
"lstrip": false,
|
| 598 |
+
"normalized": true,
|
| 599 |
+
"rstrip": false,
|
| 600 |
+
"single_word": false,
|
| 601 |
+
"special": false
|
| 602 |
+
},
|
| 603 |
+
"50327": {
|
| 604 |
+
"content": "[unused42]",
|
| 605 |
+
"lstrip": false,
|
| 606 |
+
"normalized": true,
|
| 607 |
+
"rstrip": false,
|
| 608 |
+
"single_word": false,
|
| 609 |
+
"special": false
|
| 610 |
+
},
|
| 611 |
+
"50328": {
|
| 612 |
+
"content": "[unused43]",
|
| 613 |
+
"lstrip": false,
|
| 614 |
+
"normalized": true,
|
| 615 |
+
"rstrip": false,
|
| 616 |
+
"single_word": false,
|
| 617 |
+
"special": false
|
| 618 |
+
},
|
| 619 |
+
"50329": {
|
| 620 |
+
"content": "[unused44]",
|
| 621 |
+
"lstrip": false,
|
| 622 |
+
"normalized": true,
|
| 623 |
+
"rstrip": false,
|
| 624 |
+
"single_word": false,
|
| 625 |
+
"special": false
|
| 626 |
+
},
|
| 627 |
+
"50330": {
|
| 628 |
+
"content": "[unused45]",
|
| 629 |
+
"lstrip": false,
|
| 630 |
+
"normalized": true,
|
| 631 |
+
"rstrip": false,
|
| 632 |
+
"single_word": false,
|
| 633 |
+
"special": false
|
| 634 |
+
},
|
| 635 |
+
"50331": {
|
| 636 |
+
"content": "[unused46]",
|
| 637 |
+
"lstrip": false,
|
| 638 |
+
"normalized": true,
|
| 639 |
+
"rstrip": false,
|
| 640 |
+
"single_word": false,
|
| 641 |
+
"special": false
|
| 642 |
+
},
|
| 643 |
+
"50332": {
|
| 644 |
+
"content": "[unused47]",
|
| 645 |
+
"lstrip": false,
|
| 646 |
+
"normalized": true,
|
| 647 |
+
"rstrip": false,
|
| 648 |
+
"single_word": false,
|
| 649 |
+
"special": false
|
| 650 |
+
},
|
| 651 |
+
"50333": {
|
| 652 |
+
"content": "[unused48]",
|
| 653 |
+
"lstrip": false,
|
| 654 |
+
"normalized": true,
|
| 655 |
+
"rstrip": false,
|
| 656 |
+
"single_word": false,
|
| 657 |
+
"special": false
|
| 658 |
+
},
|
| 659 |
+
"50334": {
|
| 660 |
+
"content": "[unused49]",
|
| 661 |
+
"lstrip": false,
|
| 662 |
+
"normalized": true,
|
| 663 |
+
"rstrip": false,
|
| 664 |
+
"single_word": false,
|
| 665 |
+
"special": false
|
| 666 |
+
},
|
| 667 |
+
"50335": {
|
| 668 |
+
"content": "[unused50]",
|
| 669 |
+
"lstrip": false,
|
| 670 |
+
"normalized": true,
|
| 671 |
+
"rstrip": false,
|
| 672 |
+
"single_word": false,
|
| 673 |
+
"special": false
|
| 674 |
+
},
|
| 675 |
+
"50336": {
|
| 676 |
+
"content": "[unused51]",
|
| 677 |
+
"lstrip": false,
|
| 678 |
+
"normalized": true,
|
| 679 |
+
"rstrip": false,
|
| 680 |
+
"single_word": false,
|
| 681 |
+
"special": false
|
| 682 |
+
},
|
| 683 |
+
"50337": {
|
| 684 |
+
"content": "[unused52]",
|
| 685 |
+
"lstrip": false,
|
| 686 |
+
"normalized": true,
|
| 687 |
+
"rstrip": false,
|
| 688 |
+
"single_word": false,
|
| 689 |
+
"special": false
|
| 690 |
+
},
|
| 691 |
+
"50338": {
|
| 692 |
+
"content": "[unused53]",
|
| 693 |
+
"lstrip": false,
|
| 694 |
+
"normalized": true,
|
| 695 |
+
"rstrip": false,
|
| 696 |
+
"single_word": false,
|
| 697 |
+
"special": false
|
| 698 |
+
},
|
| 699 |
+
"50339": {
|
| 700 |
+
"content": "[unused54]",
|
| 701 |
+
"lstrip": false,
|
| 702 |
+
"normalized": true,
|
| 703 |
+
"rstrip": false,
|
| 704 |
+
"single_word": false,
|
| 705 |
+
"special": false
|
| 706 |
+
},
|
| 707 |
+
"50340": {
|
| 708 |
+
"content": "[unused55]",
|
| 709 |
+
"lstrip": false,
|
| 710 |
+
"normalized": true,
|
| 711 |
+
"rstrip": false,
|
| 712 |
+
"single_word": false,
|
| 713 |
+
"special": false
|
| 714 |
+
},
|
| 715 |
+
"50341": {
|
| 716 |
+
"content": "[unused56]",
|
| 717 |
+
"lstrip": false,
|
| 718 |
+
"normalized": true,
|
| 719 |
+
"rstrip": false,
|
| 720 |
+
"single_word": false,
|
| 721 |
+
"special": false
|
| 722 |
+
},
|
| 723 |
+
"50342": {
|
| 724 |
+
"content": "[unused57]",
|
| 725 |
+
"lstrip": false,
|
| 726 |
+
"normalized": true,
|
| 727 |
+
"rstrip": false,
|
| 728 |
+
"single_word": false,
|
| 729 |
+
"special": false
|
| 730 |
+
},
|
| 731 |
+
"50343": {
|
| 732 |
+
"content": "[unused58]",
|
| 733 |
+
"lstrip": false,
|
| 734 |
+
"normalized": true,
|
| 735 |
+
"rstrip": false,
|
| 736 |
+
"single_word": false,
|
| 737 |
+
"special": false
|
| 738 |
+
},
|
| 739 |
+
"50344": {
|
| 740 |
+
"content": "[unused59]",
|
| 741 |
+
"lstrip": false,
|
| 742 |
+
"normalized": true,
|
| 743 |
+
"rstrip": false,
|
| 744 |
+
"single_word": false,
|
| 745 |
+
"special": false
|
| 746 |
+
},
|
| 747 |
+
"50345": {
|
| 748 |
+
"content": "[unused60]",
|
| 749 |
+
"lstrip": false,
|
| 750 |
+
"normalized": true,
|
| 751 |
+
"rstrip": false,
|
| 752 |
+
"single_word": false,
|
| 753 |
+
"special": false
|
| 754 |
+
},
|
| 755 |
+
"50346": {
|
| 756 |
+
"content": "[unused61]",
|
| 757 |
+
"lstrip": false,
|
| 758 |
+
"normalized": true,
|
| 759 |
+
"rstrip": false,
|
| 760 |
+
"single_word": false,
|
| 761 |
+
"special": false
|
| 762 |
+
},
|
| 763 |
+
"50347": {
|
| 764 |
+
"content": "[unused62]",
|
| 765 |
+
"lstrip": false,
|
| 766 |
+
"normalized": true,
|
| 767 |
+
"rstrip": false,
|
| 768 |
+
"single_word": false,
|
| 769 |
+
"special": false
|
| 770 |
+
},
|
| 771 |
+
"50348": {
|
| 772 |
+
"content": "[unused63]",
|
| 773 |
+
"lstrip": false,
|
| 774 |
+
"normalized": true,
|
| 775 |
+
"rstrip": false,
|
| 776 |
+
"single_word": false,
|
| 777 |
+
"special": false
|
| 778 |
+
},
|
| 779 |
+
"50349": {
|
| 780 |
+
"content": "[unused64]",
|
| 781 |
+
"lstrip": false,
|
| 782 |
+
"normalized": true,
|
| 783 |
+
"rstrip": false,
|
| 784 |
+
"single_word": false,
|
| 785 |
+
"special": false
|
| 786 |
+
},
|
| 787 |
+
"50350": {
|
| 788 |
+
"content": "[unused65]",
|
| 789 |
+
"lstrip": false,
|
| 790 |
+
"normalized": true,
|
| 791 |
+
"rstrip": false,
|
| 792 |
+
"single_word": false,
|
| 793 |
+
"special": false
|
| 794 |
+
},
|
| 795 |
+
"50351": {
|
| 796 |
+
"content": "[unused66]",
|
| 797 |
+
"lstrip": false,
|
| 798 |
+
"normalized": true,
|
| 799 |
+
"rstrip": false,
|
| 800 |
+
"single_word": false,
|
| 801 |
+
"special": false
|
| 802 |
+
},
|
| 803 |
+
"50352": {
|
| 804 |
+
"content": "[unused67]",
|
| 805 |
+
"lstrip": false,
|
| 806 |
+
"normalized": true,
|
| 807 |
+
"rstrip": false,
|
| 808 |
+
"single_word": false,
|
| 809 |
+
"special": false
|
| 810 |
+
},
|
| 811 |
+
"50353": {
|
| 812 |
+
"content": "[unused68]",
|
| 813 |
+
"lstrip": false,
|
| 814 |
+
"normalized": true,
|
| 815 |
+
"rstrip": false,
|
| 816 |
+
"single_word": false,
|
| 817 |
+
"special": false
|
| 818 |
+
},
|
| 819 |
+
"50354": {
|
| 820 |
+
"content": "[unused69]",
|
| 821 |
+
"lstrip": false,
|
| 822 |
+
"normalized": true,
|
| 823 |
+
"rstrip": false,
|
| 824 |
+
"single_word": false,
|
| 825 |
+
"special": false
|
| 826 |
+
},
|
| 827 |
+
"50355": {
|
| 828 |
+
"content": "[unused70]",
|
| 829 |
+
"lstrip": false,
|
| 830 |
+
"normalized": true,
|
| 831 |
+
"rstrip": false,
|
| 832 |
+
"single_word": false,
|
| 833 |
+
"special": false
|
| 834 |
+
},
|
| 835 |
+
"50356": {
|
| 836 |
+
"content": "[unused71]",
|
| 837 |
+
"lstrip": false,
|
| 838 |
+
"normalized": true,
|
| 839 |
+
"rstrip": false,
|
| 840 |
+
"single_word": false,
|
| 841 |
+
"special": false
|
| 842 |
+
},
|
| 843 |
+
"50357": {
|
| 844 |
+
"content": "[unused72]",
|
| 845 |
+
"lstrip": false,
|
| 846 |
+
"normalized": true,
|
| 847 |
+
"rstrip": false,
|
| 848 |
+
"single_word": false,
|
| 849 |
+
"special": false
|
| 850 |
+
},
|
| 851 |
+
"50358": {
|
| 852 |
+
"content": "[unused73]",
|
| 853 |
+
"lstrip": false,
|
| 854 |
+
"normalized": true,
|
| 855 |
+
"rstrip": false,
|
| 856 |
+
"single_word": false,
|
| 857 |
+
"special": false
|
| 858 |
+
},
|
| 859 |
+
"50359": {
|
| 860 |
+
"content": "[unused74]",
|
| 861 |
+
"lstrip": false,
|
| 862 |
+
"normalized": true,
|
| 863 |
+
"rstrip": false,
|
| 864 |
+
"single_word": false,
|
| 865 |
+
"special": false
|
| 866 |
+
},
|
| 867 |
+
"50360": {
|
| 868 |
+
"content": "[unused75]",
|
| 869 |
+
"lstrip": false,
|
| 870 |
+
"normalized": true,
|
| 871 |
+
"rstrip": false,
|
| 872 |
+
"single_word": false,
|
| 873 |
+
"special": false
|
| 874 |
+
},
|
| 875 |
+
"50361": {
|
| 876 |
+
"content": "[unused76]",
|
| 877 |
+
"lstrip": false,
|
| 878 |
+
"normalized": true,
|
| 879 |
+
"rstrip": false,
|
| 880 |
+
"single_word": false,
|
| 881 |
+
"special": false
|
| 882 |
+
},
|
| 883 |
+
"50362": {
|
| 884 |
+
"content": "[unused77]",
|
| 885 |
+
"lstrip": false,
|
| 886 |
+
"normalized": true,
|
| 887 |
+
"rstrip": false,
|
| 888 |
+
"single_word": false,
|
| 889 |
+
"special": false
|
| 890 |
+
},
|
| 891 |
+
"50363": {
|
| 892 |
+
"content": "[unused78]",
|
| 893 |
+
"lstrip": false,
|
| 894 |
+
"normalized": true,
|
| 895 |
+
"rstrip": false,
|
| 896 |
+
"single_word": false,
|
| 897 |
+
"special": false
|
| 898 |
+
},
|
| 899 |
+
"50364": {
|
| 900 |
+
"content": "[unused79]",
|
| 901 |
+
"lstrip": false,
|
| 902 |
+
"normalized": true,
|
| 903 |
+
"rstrip": false,
|
| 904 |
+
"single_word": false,
|
| 905 |
+
"special": false
|
| 906 |
+
},
|
| 907 |
+
"50365": {
|
| 908 |
+
"content": "[unused80]",
|
| 909 |
+
"lstrip": false,
|
| 910 |
+
"normalized": true,
|
| 911 |
+
"rstrip": false,
|
| 912 |
+
"single_word": false,
|
| 913 |
+
"special": false
|
| 914 |
+
},
|
| 915 |
+
"50366": {
|
| 916 |
+
"content": "[unused81]",
|
| 917 |
+
"lstrip": false,
|
| 918 |
+
"normalized": true,
|
| 919 |
+
"rstrip": false,
|
| 920 |
+
"single_word": false,
|
| 921 |
+
"special": false
|
| 922 |
+
},
|
| 923 |
+
"50367": {
|
| 924 |
+
"content": "[unused82]",
|
| 925 |
+
"lstrip": false,
|
| 926 |
+
"normalized": true,
|
| 927 |
+
"rstrip": false,
|
| 928 |
+
"single_word": false,
|
| 929 |
+
"special": false
|
| 930 |
+
}
|
| 931 |
+
},
|
| 932 |
+
"clean_up_tokenization_spaces": true,
|
| 933 |
+
"cls_token": "[CLS]",
|
| 934 |
+
"extra_special_tokens": {},
|
| 935 |
+
"mask_token": "[MASK]",
|
| 936 |
+
"max_length": 512,
|
| 937 |
+
"model_input_names": [
|
| 938 |
+
"input_ids",
|
| 939 |
+
"attention_mask"
|
| 940 |
+
],
|
| 941 |
+
"model_max_length": 8192,
|
| 942 |
+
"pad_to_multiple_of": null,
|
| 943 |
+
"pad_token": "[PAD]",
|
| 944 |
+
"pad_token_type_id": 0,
|
| 945 |
+
"padding_side": "right",
|
| 946 |
+
"sep_token": "[SEP]",
|
| 947 |
+
"stride": 0,
|
| 948 |
+
"tokenizer_class": "PreTrainedTokenizerFast",
|
| 949 |
+
"truncation_side": "right",
|
| 950 |
+
"truncation_strategy": "longest_first",
|
| 951 |
+
"unk_token": "[UNK]"
|
| 952 |
+
}
|
training_args.json
ADDED
|
@@ -0,0 +1,200 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_args": {
|
| 3 |
+
"model_name_or_path": "Alibaba-NLP/gte-reranker-modernbert-base",
|
| 4 |
+
"num_labels": null,
|
| 5 |
+
"classifier_dropout": 0.0,
|
| 6 |
+
"max_length": 512,
|
| 7 |
+
"config_name": null,
|
| 8 |
+
"tokenizer_name": null,
|
| 9 |
+
"cache_dir": null
|
| 10 |
+
},
|
| 11 |
+
"data_args": {
|
| 12 |
+
"dataset_name": "hotchpotch/wip-msmarco-context-relevance",
|
| 13 |
+
"subset": "msmarco-ja-minimal",
|
| 14 |
+
"teacher_column": null,
|
| 15 |
+
"datasets": [
|
| 16 |
+
{
|
| 17 |
+
"dataset_name": "hotchpotch/msmarco-context-relevance",
|
| 18 |
+
"subset": "freq2",
|
| 19 |
+
"teacher_column": "teacher_scores.gte-reranker-modernbert-base"
|
| 20 |
+
},
|
| 21 |
+
{
|
| 22 |
+
"dataset_name": "hotchpotch/natural-questions-context-relevance",
|
| 23 |
+
"subset": "nodup_freq2",
|
| 24 |
+
"teacher_column": "teacher_scores.gte-reranker-modernbert-base",
|
| 25 |
+
"items": 6
|
| 26 |
+
},
|
| 27 |
+
{
|
| 28 |
+
"dataset_name": "hotchpotch/gooaq-context-relevance-130k",
|
| 29 |
+
"subset": "default",
|
| 30 |
+
"teacher_column": "teacher_scores.gte-reranker-modernbert-base",
|
| 31 |
+
"items": 6
|
| 32 |
+
}
|
| 33 |
+
],
|
| 34 |
+
"items": null,
|
| 35 |
+
"max_train_samples": null,
|
| 36 |
+
"max_eval_samples": null,
|
| 37 |
+
"validation_split": null,
|
| 38 |
+
"validation_split_samples": null,
|
| 39 |
+
"validation_split_name": "validation",
|
| 40 |
+
"preprocessing_num_workers": null,
|
| 41 |
+
"filter_zero_relevance_max_items": null,
|
| 42 |
+
"filter_zero_relevance_max_items_reverse": false,
|
| 43 |
+
"filter_keep_first_item": false,
|
| 44 |
+
"upsample_factor": null
|
| 45 |
+
},
|
| 46 |
+
"training_args": {
|
| 47 |
+
"output_dir": "./output/freq-open-provence-reranker-v1_20251027_092433",
|
| 48 |
+
"overwrite_output_dir": true,
|
| 49 |
+
"do_train": true,
|
| 50 |
+
"do_eval": true,
|
| 51 |
+
"do_predict": false,
|
| 52 |
+
"eval_strategy": "steps",
|
| 53 |
+
"prediction_loss_only": false,
|
| 54 |
+
"per_device_train_batch_size": 4,
|
| 55 |
+
"per_device_eval_batch_size": 16,
|
| 56 |
+
"per_gpu_train_batch_size": null,
|
| 57 |
+
"per_gpu_eval_batch_size": null,
|
| 58 |
+
"gradient_accumulation_steps": 64,
|
| 59 |
+
"eval_accumulation_steps": null,
|
| 60 |
+
"eval_delay": 0,
|
| 61 |
+
"torch_empty_cache_steps": null,
|
| 62 |
+
"learning_rate": 5e-05,
|
| 63 |
+
"weight_decay": 0.01,
|
| 64 |
+
"adam_beta1": 0.9,
|
| 65 |
+
"adam_beta2": 0.999,
|
| 66 |
+
"adam_epsilon": 1e-08,
|
| 67 |
+
"max_grad_norm": 1.0,
|
| 68 |
+
"num_train_epochs": 1,
|
| 69 |
+
"max_steps": -1,
|
| 70 |
+
"lr_scheduler_type": "cosine",
|
| 71 |
+
"lr_scheduler_kwargs": {},
|
| 72 |
+
"warmup_ratio": 0.1,
|
| 73 |
+
"warmup_steps": 0,
|
| 74 |
+
"log_level": "passive",
|
| 75 |
+
"log_level_replica": "warning",
|
| 76 |
+
"log_on_each_node": true,
|
| 77 |
+
"logging_dir": "trainer_output/runs/Oct27_09-24-33_yuix",
|
| 78 |
+
"logging_strategy": "steps",
|
| 79 |
+
"logging_first_step": false,
|
| 80 |
+
"logging_steps": 15,
|
| 81 |
+
"logging_nan_inf_filter": true,
|
| 82 |
+
"save_strategy": "steps",
|
| 83 |
+
"save_steps": 500,
|
| 84 |
+
"save_total_limit": 5,
|
| 85 |
+
"save_safetensors": true,
|
| 86 |
+
"save_on_each_node": false,
|
| 87 |
+
"save_only_model": false,
|
| 88 |
+
"restore_callback_states_from_checkpoint": false,
|
| 89 |
+
"no_cuda": false,
|
| 90 |
+
"use_cpu": false,
|
| 91 |
+
"use_mps_device": false,
|
| 92 |
+
"seed": 42,
|
| 93 |
+
"data_seed": null,
|
| 94 |
+
"jit_mode_eval": false,
|
| 95 |
+
"bf16": true,
|
| 96 |
+
"fp16": false,
|
| 97 |
+
"fp16_opt_level": "O1",
|
| 98 |
+
"half_precision_backend": "auto",
|
| 99 |
+
"bf16_full_eval": false,
|
| 100 |
+
"fp16_full_eval": false,
|
| 101 |
+
"tf32": null,
|
| 102 |
+
"local_rank": 0,
|
| 103 |
+
"ddp_backend": null,
|
| 104 |
+
"tpu_num_cores": null,
|
| 105 |
+
"tpu_metrics_debug": false,
|
| 106 |
+
"debug": [],
|
| 107 |
+
"dataloader_drop_last": false,
|
| 108 |
+
"eval_steps": 77,
|
| 109 |
+
"dataloader_num_workers": 8,
|
| 110 |
+
"dataloader_prefetch_factor": null,
|
| 111 |
+
"past_index": -1,
|
| 112 |
+
"run_name": "freq-open-provence-reranker-v1-20251027_092433",
|
| 113 |
+
"disable_tqdm": false,
|
| 114 |
+
"remove_unused_columns": false,
|
| 115 |
+
"label_names": null,
|
| 116 |
+
"load_best_model_at_end": true,
|
| 117 |
+
"metric_for_best_model": "eval_loss",
|
| 118 |
+
"greater_is_better": false,
|
| 119 |
+
"ignore_data_skip": false,
|
| 120 |
+
"fsdp": [],
|
| 121 |
+
"fsdp_min_num_params": 0,
|
| 122 |
+
"fsdp_config": {
|
| 123 |
+
"min_num_params": 0,
|
| 124 |
+
"xla": false,
|
| 125 |
+
"xla_fsdp_v2": false,
|
| 126 |
+
"xla_fsdp_grad_ckpt": false
|
| 127 |
+
},
|
| 128 |
+
"fsdp_transformer_layer_cls_to_wrap": null,
|
| 129 |
+
"accelerator_config": "AcceleratorConfig(split_batches=False, dispatch_batches=None, even_batches=True, use_seedable_sampler=True, non_blocking=False, gradient_accumulation_kwargs=None, use_configured_state=False)",
|
| 130 |
+
"parallelism_config": null,
|
| 131 |
+
"deepspeed": null,
|
| 132 |
+
"label_smoothing_factor": 0.0,
|
| 133 |
+
"optim": "adafactor",
|
| 134 |
+
"optim_args": null,
|
| 135 |
+
"adafactor": false,
|
| 136 |
+
"group_by_length": false,
|
| 137 |
+
"length_column_name": "length",
|
| 138 |
+
"report_to": [
|
| 139 |
+
"wandb"
|
| 140 |
+
],
|
| 141 |
+
"project": "huggingface",
|
| 142 |
+
"trackio_space_id": "trackio",
|
| 143 |
+
"ddp_find_unused_parameters": null,
|
| 144 |
+
"ddp_bucket_cap_mb": null,
|
| 145 |
+
"ddp_broadcast_buffers": null,
|
| 146 |
+
"dataloader_pin_memory": true,
|
| 147 |
+
"dataloader_persistent_workers": false,
|
| 148 |
+
"skip_memory_metrics": true,
|
| 149 |
+
"use_legacy_prediction_loop": false,
|
| 150 |
+
"push_to_hub": false,
|
| 151 |
+
"resume_from_checkpoint": null,
|
| 152 |
+
"hub_model_id": null,
|
| 153 |
+
"hub_strategy": "every_save",
|
| 154 |
+
"hub_token": null,
|
| 155 |
+
"hub_private_repo": null,
|
| 156 |
+
"hub_always_push": false,
|
| 157 |
+
"hub_revision": null,
|
| 158 |
+
"gradient_checkpointing": false,
|
| 159 |
+
"gradient_checkpointing_kwargs": null,
|
| 160 |
+
"include_inputs_for_metrics": false,
|
| 161 |
+
"include_for_metrics": [],
|
| 162 |
+
"eval_do_concat_batches": true,
|
| 163 |
+
"fp16_backend": "auto",
|
| 164 |
+
"push_to_hub_model_id": null,
|
| 165 |
+
"push_to_hub_organization": null,
|
| 166 |
+
"push_to_hub_token": null,
|
| 167 |
+
"mp_parameters": "",
|
| 168 |
+
"auto_find_batch_size": false,
|
| 169 |
+
"full_determinism": false,
|
| 170 |
+
"torchdynamo": null,
|
| 171 |
+
"ray_scope": "last",
|
| 172 |
+
"ddp_timeout": 1800,
|
| 173 |
+
"torch_compile": false,
|
| 174 |
+
"torch_compile_backend": null,
|
| 175 |
+
"torch_compile_mode": null,
|
| 176 |
+
"include_tokens_per_second": false,
|
| 177 |
+
"include_num_input_tokens_seen": "no",
|
| 178 |
+
"neftune_noise_alpha": null,
|
| 179 |
+
"optim_target_modules": null,
|
| 180 |
+
"batch_eval_metrics": false,
|
| 181 |
+
"eval_on_start": false,
|
| 182 |
+
"use_liger_kernel": false,
|
| 183 |
+
"liger_kernel_config": null,
|
| 184 |
+
"eval_use_gather_object": false,
|
| 185 |
+
"average_tokens_across_devices": true,
|
| 186 |
+
"ranking_weight": 0.05,
|
| 187 |
+
"pruning_weight": 1.0,
|
| 188 |
+
"use_teacher_scores": true,
|
| 189 |
+
"sentence_level_pruning": true,
|
| 190 |
+
"standalone_process_default_language": "en",
|
| 191 |
+
"eval_datasets": {
|
| 192 |
+
"config": "configs/eval_datasets/en.yaml",
|
| 193 |
+
"threshold": 0.1,
|
| 194 |
+
"batch_size": 32
|
| 195 |
+
},
|
| 196 |
+
"distributed_state": "Distributed environment: DistributedType.NO\nNum processes: 1\nProcess index: 0\nLocal process index: 0\nDevice: cuda\n",
|
| 197 |
+
"deepspeed_plugin": null,
|
| 198 |
+
"modeling_open_provence_default_language": "en"
|
| 199 |
+
}
|
| 200 |
+
}
|