File size: 3,504 Bytes
800b2b6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2c897f3
f7a50a0
2c897f3
800b2b6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2c897f3
f7a50a0
2c897f3
f7a50a0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
800b2b6
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
{
    "average_CPS": 7.3897435,
    "config": {
        "model_name": "HiTZ/Medical-mT5-large",
        "num_fewshot": "10",
        "batch_size": 1,
        "LANG": "GR",
        "model": "HiTZ/Medical-mT5-large",
        "base_model": "MT5ForConditionalGeneration",
        "revision": "e8ae7101f0ab1ed5b8add8846e44a2d39f6e2c47",
        "submitted_time": "2023-10-31 15:15:15+00:00",
        "num_params_billion": null,
        "language": "en_es_fr_it"
    },
    "tasks": {
        "NER": {
            "prompts": [
                {
                    "prompt": "p1",
                    "metric": "f1",
                    "value": 14.549999999999999,
                    "stderr": 0.0
                },
                {
                    "prompt": "p2",
                    "metric": "f1",
                    "value": 14.34,
                    "stderr": 0.0
                },
                {
                    "prompt": "p3",
                    "metric": "f1",
                    "value": 14.549999999999999,
                    "stderr": 0.0
                }
            ],
            "average_accuracy": 14.479999999999999,
            "best_prompt": 14.549999999999999,
            "prompt_id": "p1",
            "CPS": 14.539814999999999,
            "is_dummy": false,
            "std_accuracy": 0.12124355652982088
        },
        "RE": {
            "prompts": [
                {
                    "prompt": "p1",
                    "metric": "f1",
                    "value": 0.24,
                    "stderr": 0.0
                },
                {
                    "prompt": "p2",
                    "metric": "f1",
                    "value": 0.06999999999999999,
                    "stderr": 0.0
                },
                {
                    "prompt": "p3",
                    "metric": "f1",
                    "value": 0.0,
                    "stderr": 0.0
                }
            ],
            "average_accuracy": 0.10333333333333333,
            "best_prompt": 0.24,
            "prompt_id": "p1",
            "CPS": 0.239672,
            "is_dummy": false,
            "std_accuracy": 0.12342339054382412
        },
        "RML": {
            "prompts": [
                {
                    "prompt": "p1",
                    "metric": "f1",
                    "value": 0.0,
                    "stderr": 0.0
                }
            ],
            "average_accuracy": null,
            "std_accuracy": null,
            "best_prompt": null,
            "prompt_id": null,
            "CPS": null,
            "is_dummy": true
        },
        "HIS": {
            "prompts": [
                {
                    "prompt": "p1",
                    "metric": "f1",
                    "value": 0.0,
                    "stderr": 0.0
                }
            ],
            "average_accuracy": null,
            "std_accuracy": null,
            "best_prompt": null,
            "prompt_id": null,
            "CPS": null,
            "is_dummy": true
        },
        "DIA": {
            "prompts": [
                {
                    "prompt": "p1",
                    "metric": "f1",
                    "value": 0.0,
                    "stderr": 0.0
                }
            ],
            "average_accuracy": null,
            "std_accuracy": null,
            "best_prompt": null,
            "prompt_id": null,
            "CPS": null,
            "is_dummy": true
        }
    }
}