bobox
/

DeBERTaV3-small-ST-AdaptiveLayer-Norm-ep2

@@ -89,109 +89,109 @@ model-index:
       type: unknown
     metrics:
     - type: cosine_accuracy
-      value: 0.6605795351645035
       name: Cosine Accuracy
     - type: cosine_accuracy_threshold
-      value: 0.688193678855896
       name: Cosine Accuracy Threshold
     - type: cosine_f1
-      value: 0.7076101468624832
       name: Cosine F1
     - type: cosine_f1_threshold
-      value: 0.5949093103408813
       name: Cosine F1 Threshold
     - type: cosine_precision
-      value: 0.6053997923156802
       name: Cosine Precision
     - type: cosine_recall
-      value: 0.8513434579439252
       name: Cosine Recall
     - type: cosine_ap
-      value: 0.7024412828441404
       name: Cosine Ap
     - type: dot_accuracy
-      value: 0.6320555387865983
       name: Dot Accuracy
     - type: dot_accuracy_threshold
-      value: 152.9224853515625
       name: Dot Accuracy Threshold
     - type: dot_f1
-      value: 0.6979234972677596
       name: Dot F1
     - type: dot_f1_threshold
-      value: 110.95356750488281
       name: Dot F1 Threshold
     - type: dot_precision
-      value: 0.5576318546978694
       name: Dot Precision
     - type: dot_recall
-      value: 0.9325350467289719
       name: Dot Recall
     - type: dot_ap
-      value: 0.6470829330129519
       name: Dot Ap
     - type: manhattan_accuracy
-      value: 0.661334138243284
       name: Manhattan Accuracy
     - type: manhattan_accuracy_threshold
-      value: 235.78744506835938
       name: Manhattan Accuracy Threshold
     - type: manhattan_f1
-      value: 0.7093479035514908
       name: Manhattan F1
     - type: manhattan_f1_threshold
-      value: 285.1435852050781
       name: Manhattan F1 Threshold
     - type: manhattan_precision
-      value: 0.5977977977977978
       name: Manhattan Precision
     - type: manhattan_recall
-      value: 0.8720794392523364
       name: Manhattan Recall
     - type: manhattan_ap
-      value: 0.7110821827765943
       name: Manhattan Ap
     - type: euclidean_accuracy
-      value: 0.6605795351645035
       name: Euclidean Accuracy
     - type: euclidean_accuracy_threshold
-      value: 12.528359413146973
       name: Euclidean Accuracy Threshold
     - type: euclidean_f1
-      value: 0.7051541483156768
       name: Euclidean F1
     - type: euclidean_f1_threshold
-      value: 13.97222900390625
       name: Euclidean F1 Threshold
     - type: euclidean_precision
-      value: 0.5951376331123167
       name: Euclidean Precision
     - type: euclidean_recall
-      value: 0.865070093457944
       name: Euclidean Recall
     - type: euclidean_ap
-      value: 0.7071775256273181
       name: Euclidean Ap
     - type: max_accuracy
-      value: 0.661334138243284
       name: Max Accuracy
     - type: max_accuracy_threshold
-      value: 235.78744506835938
       name: Max Accuracy Threshold
     - type: max_f1
-      value: 0.7093479035514908
       name: Max F1
     - type: max_f1_threshold
-      value: 285.1435852050781
       name: Max F1 Threshold
     - type: max_precision
-      value: 0.6053997923156802
       name: Max Precision
     - type: max_recall
-      value: 0.9325350467289719
       name: Max Recall
     - type: max_ap
-      value: 0.7110821827765943
       name: Max Ap
 ---
@@ -293,41 +293,41 @@ You can finetune this model on your own dataset.
 | Metric                       | Value      |
 |:-----------------------------|:-----------|
-| cosine_accuracy              | 0.6606     |
-| cosine_accuracy_threshold    | 0.6882     |
-| cosine_f1                    | 0.7076     |
-| cosine_f1_threshold          | 0.5949     |
-| cosine_precision             | 0.6054     |
-| cosine_recall                | 0.8513     |
-| cosine_ap                    | 0.7024     |
-| dot_accuracy                 | 0.6321     |
-| dot_accuracy_threshold       | 152.9225   |
-| dot_f1                       | 0.6979     |
-| dot_f1_threshold             | 110.9536   |
-| dot_precision                | 0.5576     |
-| dot_recall                   | 0.9325     |
-| dot_ap                       | 0.6471     |
-| manhattan_accuracy           | 0.6613     |
-| manhattan_accuracy_threshold | 235.7874   |
-| manhattan_f1                 | 0.7093     |
-| manhattan_f1_threshold       | 285.1436   |
-| manhattan_precision          | 0.5978     |
-| manhattan_recall             | 0.8721     |
-| manhattan_ap                 | 0.7111     |
-| euclidean_accuracy           | 0.6606     |
-| euclidean_accuracy_threshold | 12.5284    |
-| euclidean_f1                 | 0.7052     |
-| euclidean_f1_threshold       | 13.9722    |
-| euclidean_precision          | 0.5951     |
-| euclidean_recall             | 0.8651     |
-| euclidean_ap                 | 0.7072     |
-| max_accuracy                 | 0.6613     |
-| max_accuracy_threshold       | 235.7874   |
-| max_f1                       | 0.7093     |
-| max_f1_threshold             | 285.1436   |
-| max_precision                | 0.6054     |
-| max_recall                   | 0.9325     |
-| **max_ap**                   | **0.7111** |
 <!--
 ## Bias, Risks and Limitations
@@ -366,10 +366,10 @@ You can finetune this model on your own dataset.
   {
       "loss": "MultipleNegativesRankingLoss",
       "n_layers_per_step": 1,
-      "last_layer_weight": 1.5,
-      "prior_layers_weight": 1,
       "kl_div_weight": 2,
-      "kl_temperature": 1
   }
   ```
@@ -396,10 +396,10 @@ You can finetune this model on your own dataset.
   {
       "loss": "MultipleNegativesRankingLoss",
       "n_layers_per_step": 1,
-      "last_layer_weight": 1.5,
-      "prior_layers_weight": 1,
       "kl_div_weight": 2,
-      "kl_temperature": 1
   }
   ```
@@ -538,34 +538,34 @@ You can finetune this model on your own dataset.
 ### Training Logs
 | Epoch  | Step | Training Loss | loss   | max_ap |
 |:------:|:----:|:-------------:|:------:|:------:|
-| 0.1004 | 150  | 6.8384        | -      | -      |
-| 0.2001 | 299  | -             | 6.3046 | 0.6155 |
-| 0.2008 | 300  | 5.9024        | -      | -      |
-| 0.3012 | 450  | 4.9822        | -      | -      |
-| 0.4003 | 598  | -             | 5.1572 | 0.6595 |
-| 0.4016 | 600  | 4.3996        | -      | -      |
-| 0.5020 | 750  | 3.6015        | -      | -      |
-| 0.6004 | 897  | -             | 4.0073 | 0.6904 |
-| 0.6024 | 900  | 3.0732        | -      | -      |
-| 0.7028 | 1050 | 2.7211        | -      | -      |
-| 0.8005 | 1196 | -             | 3.3433 | 0.7034 |
-| 0.8032 | 1200 | 2.4196        | -      | -      |
-| 0.9036 | 1350 | 2.2256        | -      | -      |
-| 1.0007 | 1495 | -             | 2.9401 | 0.7079 |
-| 1.0040 | 1500 | 2.0015        | -      | -      |
-| 1.1044 | 1650 | 1.9828        | -      | -      |
-| 1.2008 | 1794 | -             | 2.8339 | 0.7104 |
-| 1.2048 | 1800 | 1.8243        | -      | -      |
-| 1.3052 | 1950 | 1.7393        | -      | -      |
-| 1.4009 | 2093 | -             | 2.5906 | 0.7120 |
-| 1.4056 | 2100 | 1.7702        | -      | -      |
-| 1.5060 | 2250 | 1.615         | -      | -      |
-| 1.6011 | 2392 | -             | 2.5455 | 0.7111 |
-| 1.6064 | 2400 | 1.6249        | -      | -      |
-| 1.7068 | 2550 | 1.5804        | -      | -      |
-| 1.8012 | 2691 | -             | 2.4747 | 0.7111 |
-| 1.8072 | 2700 | 1.5935        | -      | -      |
-| 1.9076 | 2850 | 1.5088        | -      | -      |
 ### Framework Versions

       type: unknown
     metrics:
     - type: cosine_accuracy
+      value: 0.6651071536371869
       name: Cosine Accuracy
     - type: cosine_accuracy_threshold
+      value: 0.687929630279541
       name: Cosine Accuracy Threshold
     - type: cosine_f1
+      value: 0.7077349458301839
       name: Cosine F1
     - type: cosine_f1_threshold
+      value: 0.6304811239242554
       name: Cosine F1 Threshold
     - type: cosine_precision
+      value: 0.6222862206468763
       name: Cosine Precision
     - type: cosine_recall
+      value: 0.8203855140186916
       name: Cosine Recall
     - type: cosine_ap
+      value: 0.7058220689813709
       name: Cosine Ap
     - type: dot_accuracy
+      value: 0.6313009357078176
       name: Dot Accuracy
     - type: dot_accuracy_threshold
+      value: 135.98495483398438
       name: Dot Accuracy Threshold
     - type: dot_f1
+      value: 0.6997334569475027
       name: Dot F1
     - type: dot_f1_threshold
+      value: 115.54609680175781
       name: Dot F1 Threshold
     - type: dot_precision
+      value: 0.5800192122958694
       name: Dot Precision
     - type: dot_recall
+      value: 0.8817172897196262
       name: Dot Recall
     - type: dot_ap
+      value: 0.6554755795160082
       name: Dot Ap
     - type: manhattan_accuracy
+      value: 0.6708421370359191
       name: Manhattan Accuracy
     - type: manhattan_accuracy_threshold
+      value: 219.32388305664062
       name: Manhattan Accuracy Threshold
     - type: manhattan_f1
+      value: 0.7119951778179626
       name: Manhattan F1
     - type: manhattan_f1_threshold
+      value: 262.314697265625
       name: Manhattan F1 Threshold
     - type: manhattan_precision
+      value: 0.6062410182714022
       name: Manhattan Precision
     - type: manhattan_recall
+      value: 0.8624415887850467
       name: Manhattan Recall
     - type: manhattan_ap
+      value: 0.7135236162968746
       name: Manhattan Ap
     - type: euclidean_accuracy
+      value: 0.6652580742529429
       name: Euclidean Accuracy
     - type: euclidean_accuracy_threshold
+      value: 11.506816864013672
       name: Euclidean Accuracy Threshold
     - type: euclidean_f1
+      value: 0.7080090384132564
       name: Euclidean F1
     - type: euclidean_f1_threshold
+      value: 12.478536605834961
       name: Euclidean F1 Threshold
     - type: euclidean_precision
+      value: 0.6208718626155878
       name: Euclidean Precision
     - type: euclidean_recall
+      value: 0.8235981308411215
       name: Euclidean Recall
     - type: euclidean_ap
+      value: 0.7090362803652147
       name: Euclidean Ap
     - type: max_accuracy
+      value: 0.6708421370359191
       name: Max Accuracy
     - type: max_accuracy_threshold
+      value: 219.32388305664062
       name: Max Accuracy Threshold
     - type: max_f1
+      value: 0.7119951778179626
       name: Max F1
     - type: max_f1_threshold
+      value: 262.314697265625
       name: Max F1 Threshold
     - type: max_precision
+      value: 0.6222862206468763
       name: Max Precision
     - type: max_recall
+      value: 0.8817172897196262
       name: Max Recall
     - type: max_ap
+      value: 0.7135236162968746
       name: Max Ap
 ---
 | Metric                       | Value      |
 |:-----------------------------|:-----------|
+| cosine_accuracy              | 0.6651     |
+| cosine_accuracy_threshold    | 0.6879     |
+| cosine_f1                    | 0.7077     |
+| cosine_f1_threshold          | 0.6305     |
+| cosine_precision             | 0.6223     |
+| cosine_recall                | 0.8204     |
+| cosine_ap                    | 0.7058     |
+| dot_accuracy                 | 0.6313     |
+| dot_accuracy_threshold       | 135.985    |
+| dot_f1                       | 0.6997     |
+| dot_f1_threshold             | 115.5461   |
+| dot_precision                | 0.58       |
+| dot_recall                   | 0.8817     |
+| dot_ap                       | 0.6555     |
+| manhattan_accuracy           | 0.6708     |
+| manhattan_accuracy_threshold | 219.3239   |
+| manhattan_f1                 | 0.712      |
+| manhattan_f1_threshold       | 262.3147   |
+| manhattan_precision          | 0.6062     |
+| manhattan_recall             | 0.8624     |
+| manhattan_ap                 | 0.7135     |
+| euclidean_accuracy           | 0.6653     |
+| euclidean_accuracy_threshold | 11.5068    |
+| euclidean_f1                 | 0.708      |
+| euclidean_f1_threshold       | 12.4785    |
+| euclidean_precision          | 0.6209     |
+| euclidean_recall             | 0.8236     |
+| euclidean_ap                 | 0.709      |
+| max_accuracy                 | 0.6708     |
+| max_accuracy_threshold       | 219.3239   |
+| max_f1                       | 0.712      |
+| max_f1_threshold             | 262.3147   |
+| max_precision                | 0.6223     |
+| max_recall                   | 0.8817     |
+| **max_ap**                   | **0.7135** |
 <!--
 ## Bias, Risks and Limitations
   {
       "loss": "MultipleNegativesRankingLoss",
       "n_layers_per_step": 1,
+      "last_layer_weight": 1,
+      "prior_layers_weight": 0.05,
       "kl_div_weight": 2,
+      "kl_temperature": 0.9
   }
   ```
   {
       "loss": "MultipleNegativesRankingLoss",
       "n_layers_per_step": 1,
+      "last_layer_weight": 1,
+      "prior_layers_weight": 0.05,
       "kl_div_weight": 2,
+      "kl_temperature": 0.9
   }
   ```
 ### Training Logs
 | Epoch  | Step | Training Loss | loss   | max_ap |
 |:------:|:----:|:-------------:|:------:|:------:|
+| 0.1004 | 150  | 4.5827        | -      | -      |
+| 0.2001 | 299  | -             | 3.5735 | 0.6133 |
+| 0.2008 | 300  | 3.5451        | -      | -      |
+| 0.3012 | 450  | 2.9066        | -      | -      |
+| 0.4003 | 598  | -             | 2.8785 | 0.6561 |
+| 0.4016 | 600  | 2.5141        | -      | -      |
+| 0.5020 | 750  | 2.0248        | -      | -      |
+| 0.6004 | 897  | -             | 2.1300 | 0.6917 |
+| 0.6024 | 900  | 1.6782        | -      | -      |
+| 0.7028 | 1050 | 1.4187        | -      | -      |
+| 0.8005 | 1196 | -             | 1.7111 | 0.7051 |
+| 0.8032 | 1200 | 1.2446        | -      | -      |
+| 0.9036 | 1350 | 1.1078        | -      | -      |
+| 1.0007 | 1495 | -             | 1.4859 | 0.7108 |
+| 1.0040 | 1500 | 0.9827        | -      | -      |
+| 1.1044 | 1650 | 0.9335        | -      | -      |
+| 1.2008 | 1794 | -             | 1.3516 | 0.7121 |
+| 1.2048 | 1800 | 0.8595        | -      | -      |
+| 1.3052 | 1950 | 0.8362        | -      | -      |
+| 1.4009 | 2093 | -             | 1.2659 | 0.7147 |
+| 1.4056 | 2100 | 0.8167        | -      | -      |
+| 1.5060 | 2250 | 0.7695        | -      | -      |
+| 1.6011 | 2392 | -             | 1.2218 | 0.7135 |
+| 1.6064 | 2400 | 0.7544        | -      | -      |
+| 1.7068 | 2550 | 0.7625        | -      | -      |
+| 1.8012 | 2691 | -             | 1.2073 | 0.7135 |
+| 1.8072 | 2700 | 0.7366        | -      | -      |
+| 1.9076 | 2850 | 0.7348        | -      | -      |
 ### Framework Versions

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9b93c9d7c3dd14655bcd8b8f7526e0c331aeb9ead053243ae631a7970785cfee
 size 565251810

 version https://git-lfs.github.com/spec/v1
+oid sha256:d987747af13557ed9ce9d67bddcbcc93242a3bea2f8ca559470e5c3ae052aa72
 size 565251810