Model save
Browse files- README.md +74 -74
- emissions.csv +2 -1
- runs/Jun05_14-24-25_Tom/events.out.tfevents.1717590271.Tom.22032.0 +2 -2
README.md
CHANGED
|
@@ -63,14 +63,14 @@ widget:
|
|
| 63 |
- I don't know how cold it got last night.
|
| 64 |
pipeline_tag: sentence-similarity
|
| 65 |
co2_eq_emissions:
|
| 66 |
-
emissions: 6.
|
| 67 |
-
energy_consumed: 0.
|
| 68 |
source: codecarbon
|
| 69 |
training_type: fine-tuning
|
| 70 |
on_cloud: false
|
| 71 |
cpu_model: 13th Gen Intel(R) Core(TM) i7-13700K
|
| 72 |
ram_total_size: 31.777088165283203
|
| 73 |
-
hours_used: 0.
|
| 74 |
hardware_used: 1 x NVIDIA GeForce RTX 3090
|
| 75 |
model-index:
|
| 76 |
- name: SentenceTransformer based on microsoft/mpnet-base
|
|
@@ -83,34 +83,34 @@ model-index:
|
|
| 83 |
type: sts-dev
|
| 84 |
metrics:
|
| 85 |
- type: pearson_cosine
|
| 86 |
-
value: 0.
|
| 87 |
name: Pearson Cosine
|
| 88 |
- type: spearman_cosine
|
| 89 |
-
value: 0.
|
| 90 |
name: Spearman Cosine
|
| 91 |
- type: pearson_manhattan
|
| 92 |
-
value: 0.
|
| 93 |
name: Pearson Manhattan
|
| 94 |
- type: spearman_manhattan
|
| 95 |
-
value: 0.
|
| 96 |
name: Spearman Manhattan
|
| 97 |
- type: pearson_euclidean
|
| 98 |
-
value: 0.
|
| 99 |
name: Pearson Euclidean
|
| 100 |
- type: spearman_euclidean
|
| 101 |
-
value: 0.
|
| 102 |
name: Spearman Euclidean
|
| 103 |
- type: pearson_dot
|
| 104 |
-
value: 0.
|
| 105 |
name: Pearson Dot
|
| 106 |
- type: spearman_dot
|
| 107 |
-
value: 0.
|
| 108 |
name: Spearman Dot
|
| 109 |
- type: pearson_max
|
| 110 |
-
value: 0.
|
| 111 |
name: Pearson Max
|
| 112 |
- type: spearman_max
|
| 113 |
-
value: 0.
|
| 114 |
name: Spearman Max
|
| 115 |
- task:
|
| 116 |
type: semantic-similarity
|
|
@@ -120,34 +120,34 @@ model-index:
|
|
| 120 |
type: sts-test
|
| 121 |
metrics:
|
| 122 |
- type: pearson_cosine
|
| 123 |
-
value: 0.
|
| 124 |
name: Pearson Cosine
|
| 125 |
- type: spearman_cosine
|
| 126 |
-
value: 0.
|
| 127 |
name: Spearman Cosine
|
| 128 |
- type: pearson_manhattan
|
| 129 |
-
value: 0.
|
| 130 |
name: Pearson Manhattan
|
| 131 |
- type: spearman_manhattan
|
| 132 |
-
value: 0.
|
| 133 |
name: Spearman Manhattan
|
| 134 |
- type: pearson_euclidean
|
| 135 |
-
value: 0.
|
| 136 |
name: Pearson Euclidean
|
| 137 |
- type: spearman_euclidean
|
| 138 |
-
value: 0.
|
| 139 |
name: Spearman Euclidean
|
| 140 |
- type: pearson_dot
|
| 141 |
-
value: 0.
|
| 142 |
name: Pearson Dot
|
| 143 |
- type: spearman_dot
|
| 144 |
-
value: 0.
|
| 145 |
name: Spearman Dot
|
| 146 |
- type: pearson_max
|
| 147 |
-
value: 0.
|
| 148 |
name: Pearson Max
|
| 149 |
- type: spearman_max
|
| 150 |
-
value: 0.
|
| 151 |
name: Spearman Max
|
| 152 |
---
|
| 153 |
|
|
@@ -252,16 +252,16 @@ You can finetune this model on your own dataset.
|
|
| 252 |
|
| 253 |
| Metric | Value |
|
| 254 |
|:-------------------|:-----------|
|
| 255 |
-
| pearson_cosine | 0.
|
| 256 |
-
| spearman_cosine | 0.
|
| 257 |
-
| pearson_manhattan | 0.
|
| 258 |
-
| spearman_manhattan | 0.
|
| 259 |
-
| pearson_euclidean | 0.
|
| 260 |
-
| spearman_euclidean | 0.
|
| 261 |
-
| pearson_dot | 0.
|
| 262 |
-
| **spearman_dot** | **0.
|
| 263 |
-
| pearson_max | 0.
|
| 264 |
-
| spearman_max | 0.
|
| 265 |
|
| 266 |
#### Semantic Similarity
|
| 267 |
* Dataset: `sts-test`
|
|
@@ -269,16 +269,16 @@ You can finetune this model on your own dataset.
|
|
| 269 |
|
| 270 |
| Metric | Value |
|
| 271 |
|:--------------------|:-----------|
|
| 272 |
-
| pearson_cosine | 0.
|
| 273 |
-
| **spearman_cosine** | **0.
|
| 274 |
-
| pearson_manhattan | 0.
|
| 275 |
-
| spearman_manhattan | 0.
|
| 276 |
-
| pearson_euclidean | 0.
|
| 277 |
-
| spearman_euclidean | 0.
|
| 278 |
-
| pearson_dot | 0.
|
| 279 |
-
| spearman_dot | 0.
|
| 280 |
-
| pearson_max | 0.
|
| 281 |
-
| spearman_max | 0.
|
| 282 |
|
| 283 |
<!--
|
| 284 |
## Bias, Risks and Limitations
|
|
@@ -548,43 +548,43 @@ You can finetune this model on your own dataset.
|
|
| 548 |
</details>
|
| 549 |
|
| 550 |
### Training Logs
|
| 551 |
-
| Epoch | Step | Training Loss |
|
| 552 |
-
|
| 553 |
-
| 0.0370 | 10 | 0.
|
| 554 |
-
| 0.0741 | 20 | 0.
|
| 555 |
-
| 0.1111 | 30 | 0.
|
| 556 |
-
| 0.1481 | 40 | 0.
|
| 557 |
-
| 0.1852 | 50 | 0.
|
| 558 |
-
| 0.2222 | 60 | 0.
|
| 559 |
-
| 0.2593 | 70 | 0.
|
| 560 |
-
| 0.2963 | 80 | 0.
|
| 561 |
-
| 0.3333 | 90 | 0.
|
| 562 |
-
| 0.3704 | 100 | 0.
|
| 563 |
-
| 0.4074 | 110 | 0.
|
| 564 |
-
| 0.4444 | 120 | 0.
|
| 565 |
-
| 0.4815 | 130 | 0.
|
| 566 |
-
| 0.5185 | 140 | 0.
|
| 567 |
-
| 0.5556 | 150 | 0.
|
| 568 |
-
| 0.5926 | 160 | 0.
|
| 569 |
-
| 0.6296 | 170 | 0.
|
| 570 |
-
| 0.6667 | 180 | 0.
|
| 571 |
-
| 0.7037 | 190 | 0.
|
| 572 |
-
| 0.7407 | 200 | 0.
|
| 573 |
-
| 0.7778
|
| 574 |
-
| 0.8148 | 220 | 0.
|
| 575 |
-
| 0.8519 | 230 | 0.
|
| 576 |
-
|
|
| 577 |
-
| 0.9259 | 250 | 0.
|
| 578 |
-
| 0.9630 | 260 | 0.
|
| 579 |
-
| 1.0 | 270 | 0.
|
| 580 |
|
| 581 |
* The bold row denotes the saved checkpoint.
|
| 582 |
|
| 583 |
### Environmental Impact
|
| 584 |
Carbon emissions were measured using [CodeCarbon](https://github.com/mlco2/codecarbon).
|
| 585 |
-
- **Energy Consumed**: 0.
|
| 586 |
- **Carbon Emitted**: 0.007 kg of CO2
|
| 587 |
-
- **Hours Used**: 0.
|
| 588 |
|
| 589 |
### Training Hardware
|
| 590 |
- **On Cloud**: No
|
|
|
|
| 63 |
- I don't know how cold it got last night.
|
| 64 |
pipeline_tag: sentence-similarity
|
| 65 |
co2_eq_emissions:
|
| 66 |
+
emissions: 6.863209894681815
|
| 67 |
+
energy_consumed: 0.017656739339344318
|
| 68 |
source: codecarbon
|
| 69 |
training_type: fine-tuning
|
| 70 |
on_cloud: false
|
| 71 |
cpu_model: 13th Gen Intel(R) Core(TM) i7-13700K
|
| 72 |
ram_total_size: 31.777088165283203
|
| 73 |
+
hours_used: 0.068
|
| 74 |
hardware_used: 1 x NVIDIA GeForce RTX 3090
|
| 75 |
model-index:
|
| 76 |
- name: SentenceTransformer based on microsoft/mpnet-base
|
|
|
|
| 83 |
type: sts-dev
|
| 84 |
metrics:
|
| 85 |
- type: pearson_cosine
|
| 86 |
+
value: 0.8344104750902503
|
| 87 |
name: Pearson Cosine
|
| 88 |
- type: spearman_cosine
|
| 89 |
+
value: 0.8294923795333993
|
| 90 |
name: Spearman Cosine
|
| 91 |
- type: pearson_manhattan
|
| 92 |
+
value: 0.8316959259914674
|
| 93 |
name: Pearson Manhattan
|
| 94 |
- type: spearman_manhattan
|
| 95 |
+
value: 0.8331844817222047
|
| 96 |
name: Spearman Manhattan
|
| 97 |
- type: pearson_euclidean
|
| 98 |
+
value: 0.8272941934077804
|
| 99 |
name: Pearson Euclidean
|
| 100 |
- type: spearman_euclidean
|
| 101 |
+
value: 0.8294923795333993
|
| 102 |
name: Spearman Euclidean
|
| 103 |
- type: pearson_dot
|
| 104 |
+
value: 0.8344104825648291
|
| 105 |
name: Pearson Dot
|
| 106 |
- type: spearman_dot
|
| 107 |
+
value: 0.8294923795333993
|
| 108 |
name: Spearman Dot
|
| 109 |
- type: pearson_max
|
| 110 |
+
value: 0.8344104825648291
|
| 111 |
name: Pearson Max
|
| 112 |
- type: spearman_max
|
| 113 |
+
value: 0.8331844817222047
|
| 114 |
name: Spearman Max
|
| 115 |
- task:
|
| 116 |
type: semantic-similarity
|
|
|
|
| 120 |
type: sts-test
|
| 121 |
metrics:
|
| 122 |
- type: pearson_cosine
|
| 123 |
+
value: 0.7776062173443514
|
| 124 |
name: Pearson Cosine
|
| 125 |
- type: spearman_cosine
|
| 126 |
+
value: 0.7642518713703523
|
| 127 |
name: Spearman Cosine
|
| 128 |
- type: pearson_manhattan
|
| 129 |
+
value: 0.7788269653910183
|
| 130 |
name: Pearson Manhattan
|
| 131 |
- type: spearman_manhattan
|
| 132 |
+
value: 0.7659203139768728
|
| 133 |
name: Spearman Manhattan
|
| 134 |
- type: pearson_euclidean
|
| 135 |
+
value: 0.7763456809736229
|
| 136 |
name: Pearson Euclidean
|
| 137 |
- type: spearman_euclidean
|
| 138 |
+
value: 0.7642518713703523
|
| 139 |
name: Spearman Euclidean
|
| 140 |
- type: pearson_dot
|
| 141 |
+
value: 0.7776062158976489
|
| 142 |
name: Pearson Dot
|
| 143 |
- type: spearman_dot
|
| 144 |
+
value: 0.7642518713703523
|
| 145 |
name: Spearman Dot
|
| 146 |
- type: pearson_max
|
| 147 |
+
value: 0.7788269653910183
|
| 148 |
name: Pearson Max
|
| 149 |
- type: spearman_max
|
| 150 |
+
value: 0.7659203139768728
|
| 151 |
name: Spearman Max
|
| 152 |
---
|
| 153 |
|
|
|
|
| 252 |
|
| 253 |
| Metric | Value |
|
| 254 |
|:-------------------|:-----------|
|
| 255 |
+
| pearson_cosine | 0.8344 |
|
| 256 |
+
| spearman_cosine | 0.8295 |
|
| 257 |
+
| pearson_manhattan | 0.8317 |
|
| 258 |
+
| spearman_manhattan | 0.8332 |
|
| 259 |
+
| pearson_euclidean | 0.8273 |
|
| 260 |
+
| spearman_euclidean | 0.8295 |
|
| 261 |
+
| pearson_dot | 0.8344 |
|
| 262 |
+
| **spearman_dot** | **0.8295** |
|
| 263 |
+
| pearson_max | 0.8344 |
|
| 264 |
+
| spearman_max | 0.8332 |
|
| 265 |
|
| 266 |
#### Semantic Similarity
|
| 267 |
* Dataset: `sts-test`
|
|
|
|
| 269 |
|
| 270 |
| Metric | Value |
|
| 271 |
|:--------------------|:-----------|
|
| 272 |
+
| pearson_cosine | 0.7776 |
|
| 273 |
+
| **spearman_cosine** | **0.7643** |
|
| 274 |
+
| pearson_manhattan | 0.7788 |
|
| 275 |
+
| spearman_manhattan | 0.7659 |
|
| 276 |
+
| pearson_euclidean | 0.7763 |
|
| 277 |
+
| spearman_euclidean | 0.7643 |
|
| 278 |
+
| pearson_dot | 0.7776 |
|
| 279 |
+
| spearman_dot | 0.7643 |
|
| 280 |
+
| pearson_max | 0.7788 |
|
| 281 |
+
| spearman_max | 0.7659 |
|
| 282 |
|
| 283 |
<!--
|
| 284 |
## Bias, Risks and Limitations
|
|
|
|
| 548 |
</details>
|
| 549 |
|
| 550 |
### Training Logs
|
| 551 |
+
| Epoch | Step | Training Loss | multi nli loss | snli loss | stsb loss | sts-dev_spearman_dot | sts-test_spearman_cosine |
|
| 552 |
+
|:----------:|:-------:|:-------------:|:--------------:|:----------:|:----------:|:--------------------:|:------------------------:|
|
| 553 |
+
| 0.0370 | 10 | 0.8347 | - | - | - | - | - |
|
| 554 |
+
| 0.0741 | 20 | 0.8269 | - | - | - | - | - |
|
| 555 |
+
| 0.1111 | 30 | 0.7036 | 1.0978 | 1.0984 | 0.0830 | 0.6636 | - |
|
| 556 |
+
| 0.1481 | 40 | 0.7889 | - | - | - | - | - |
|
| 557 |
+
| 0.1852 | 50 | 0.7948 | - | - | - | - | - |
|
| 558 |
+
| 0.2222 | 60 | 0.688 | 1.0976 | 1.0961 | 0.0679 | 0.7124 | - |
|
| 559 |
+
| 0.2593 | 70 | 0.7911 | - | - | - | - | - |
|
| 560 |
+
| 0.2963 | 80 | 0.7847 | - | - | - | - | - |
|
| 561 |
+
| 0.3333 | 90 | 0.6801 | 1.0950 | 1.0942 | 0.0522 | 0.7810 | - |
|
| 562 |
+
| 0.3704 | 100 | 0.7837 | - | - | - | - | - |
|
| 563 |
+
| 0.4074 | 110 | 0.7803 | - | - | - | - | - |
|
| 564 |
+
| 0.4444 | 120 | 0.6756 | 1.0978 | 1.0929 | 0.0441 | 0.8157 | - |
|
| 565 |
+
| 0.4815 | 130 | 0.7829 | - | - | - | - | - |
|
| 566 |
+
| 0.5185 | 140 | 0.7789 | - | - | - | - | - |
|
| 567 |
+
| 0.5556 | 150 | 0.6756 | 1.0954 | 1.0911 | 0.0433 | 0.8215 | - |
|
| 568 |
+
| 0.5926 | 160 | 0.7802 | - | - | - | - | - |
|
| 569 |
+
| 0.6296 | 170 | 0.7751 | - | - | - | - | - |
|
| 570 |
+
| 0.6667 | 180 | 0.6679 | 1.0934 | 1.0885 | 0.0401 | 0.8235 | - |
|
| 571 |
+
| 0.7037 | 190 | 0.7755 | - | - | - | - | - |
|
| 572 |
+
| 0.7407 | 200 | 0.775 | - | - | - | - | - |
|
| 573 |
+
| **0.7778** | **210** | **0.6694** | **1.0919** | **1.0859** | **0.0377** | **0.8295** | **-** |
|
| 574 |
+
| 0.8148 | 220 | 0.7733 | - | - | - | - | - |
|
| 575 |
+
| 0.8519 | 230 | 0.772 | - | - | - | - | - |
|
| 576 |
+
| 0.8889 | 240 | 0.6656 | 1.0891 | 1.0838 | 0.0365 | 0.8292 | - |
|
| 577 |
+
| 0.9259 | 250 | 0.7726 | - | - | - | - | - |
|
| 578 |
+
| 0.9630 | 260 | 0.7731 | - | - | - | - | - |
|
| 579 |
+
| 1.0 | 270 | 0.6674 | 1.0888 | 1.0833 | 0.0372 | 0.8295 | 0.7643 |
|
| 580 |
|
| 581 |
* The bold row denotes the saved checkpoint.
|
| 582 |
|
| 583 |
### Environmental Impact
|
| 584 |
Carbon emissions were measured using [CodeCarbon](https://github.com/mlco2/codecarbon).
|
| 585 |
+
- **Energy Consumed**: 0.018 kWh
|
| 586 |
- **Carbon Emitted**: 0.007 kg of CO2
|
| 587 |
+
- **Hours Used**: 0.068 hours
|
| 588 |
|
| 589 |
### Training Hardware
|
| 590 |
- **On Cloud**: No
|
emissions.csv
CHANGED
|
@@ -1,3 +1,4 @@
|
|
| 1 |
timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
|
| 2 |
2024-06-05T13:25:31,codecarbon,8f78a832-cb8b-4255-90f9-87291ab5a2c5,203.90490198135376,0.0066664767107362,3.269404828406667e-05,42.5,262.78315247135714,11.9164080619812,0.0024072106483909,0.0140688801439834,0.0006745199858985,0.0171506107782729,The Netherlands,NLD,utrecht,,,Windows-10-10.0.22631-SP0,3.11.6,2.3.4,24,13th Gen Intel(R) Core(TM) i7-13700K,1,1 x NVIDIA GeForce RTX 3090,5.0582,52.0756,31.777088165283203,machine,N,1.0
|
| 3 |
-
2024-06-05T14:02:28,codecarbon,c19a4b76-5dda-443e-a1eb-73550f818127,200.
|
|
|
|
|
|
| 1 |
timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
|
| 2 |
2024-06-05T13:25:31,codecarbon,8f78a832-cb8b-4255-90f9-87291ab5a2c5,203.90490198135376,0.0066664767107362,3.269404828406667e-05,42.5,262.78315247135714,11.9164080619812,0.0024072106483909,0.0140688801439834,0.0006745199858985,0.0171506107782729,The Netherlands,NLD,utrecht,,,Windows-10-10.0.22631-SP0,3.11.6,2.3.4,24,13th Gen Intel(R) Core(TM) i7-13700K,1,1 x NVIDIA GeForce RTX 3090,5.0582,52.0756,31.777088165283203,machine,N,1.0
|
| 3 |
+
2024-06-05T14:02:28,codecarbon,c19a4b76-5dda-443e-a1eb-73550f818127,200.78387594223025,0.0065439122030958,3.259182129235663e-05,42.5,248.66806443178965,11.9164080619812,0.0023703652020957,0.0138007013183294,0.0006642268485203,0.0168352933689455,The Netherlands,NLD,utrecht,,,Windows-10-10.0.22631-SP0,3.11.6,2.3.4,24,13th Gen Intel(R) Core(TM) i7-13700K,1,1 x NVIDIA GeForce RTX 3090,5.0582,52.0756,31.777088165283203,machine,N,1.0
|
| 4 |
+
2024-06-05T14:28:07,codecarbon,8f089da1-33f1-4fca-8f92-14f942b5d735,210.7226061820984,0.006863209894681815,3.256987951615828e-05,42.5,170.86763354628195,11.916408061981201,0.0024876974340942173,0.014472137411034147,0.0006969044942159526,0.017656739339344318,The Netherlands,NLD,utrecht,,,Windows-10-10.0.22631-SP0,3.11.6,2.3.4,24,13th Gen Intel(R) Core(TM) i7-13700K,1,1 x NVIDIA GeForce RTX 3090,5.0582,52.0756,31.777088165283203,machine,N,1.0
|
runs/Jun05_14-24-25_Tom/events.out.tfevents.1717590271.Tom.22032.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5daa10416f13952f48a2b55db8df31a9bebe5122191c678dd1a01461154db825
|
| 3 |
+
size 24190
|