Model save

Files changed (9) hide show

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
     "train_loss": 4.621011098225911,
-    "train_runtime": 40.2608,
     "train_samples": 3000,
-    "train_samples_per_second": 223.543,
-    "train_steps_per_second": 0.894
 }

 {
     "epoch": 3.0,
     "train_loss": 4.621011098225911,
+    "train_runtime": 40.2946,
     "train_samples": 3000,
+    "train_samples_per_second": 223.355,
+    "train_steps_per_second": 0.893
 }

args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:487e31429614afd7e284f2fbbfa60f8641f08267f6cb8303e68bafbbe12cd651
 size 5652

 version https://git-lfs.github.com/spec/v1
+oid sha256:abc41cf6e45166d7704c9e792670b81f9584e8f4f477af4235a86aa107312ece
 size 5652

config.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "_name_or_path": "distilbert-base-uncased",
   "activation": "gelu",
   "architectures": [
-    "QuantizedDistilBertForQuestionAnswering"
   ],
   "attention_dropout": 0.1,
   "dim": 768,

   "_name_or_path": "distilbert-base-uncased",
   "activation": "gelu",
   "architectures": [
+    "DistilBertForQuestionAnswering"
   ],
   "attention_dropout": 0.1,
   "dim": 768,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b3ef050729f0931a1ab4b251d4ccc9bd10abefc57d7de8209769201e2e17232c
-size 265832945

 version https://git-lfs.github.com/spec/v1
+oid sha256:45f49d0d4ef9d2b6a142d56f5151687051e5e54606390c6de709e339848665c4
+size 265493026

raw_pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1f0839ac6d21be64cac0d009add03e24b92d8146d213fbb1f1473a3a4c3ea9e
-size 265864653

 version https://git-lfs.github.com/spec/v1
+oid sha256:ace5d339b09a1b5d89214c499f75ccb2fefdcce154e576b06cc71a1361c8eb03
+size 435382250

tokenizer.json CHANGED Viewed

@@ -1,21 +1,7 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 384,
-    "strategy": "OnlySecond",
-    "stride": 128
-  },
-  "padding": {
-    "strategy": {
-      "Fixed": 384
-    },
-    "direction": "Right",
-    "pad_to_multiple_of": null,
-    "pad_id": 0,
-    "pad_type_id": 0,
-    "pad_token": "[PAD]"
-  },
   "added_tokens": [
     {
       "id": 0,

 {
   "version": "1.0",
+  "truncation": null,
+  "padding": null,
   "added_tokens": [
     {
       "id": 0,

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
     "train_loss": 4.621011098225911,
-    "train_runtime": 40.2608,
     "train_samples": 3000,
-    "train_samples_per_second": 223.543,
-    "train_steps_per_second": 0.894
 }

 {
     "epoch": 3.0,
     "train_loss": 4.621011098225911,
+    "train_runtime": 40.2946,
     "train_samples": 3000,
+    "train_samples_per_second": 223.355,
+    "train_steps_per_second": 0.893
 }

trainer_state.json CHANGED Viewed

@@ -13,9 +13,9 @@
       "step": 36,
       "total_flos": 881908425216000.0,
       "train_loss": 4.621011098225911,
-      "train_runtime": 40.2608,
-      "train_samples_per_second": 223.543,
-      "train_steps_per_second": 0.894
     }
   ],
   "logging_steps": 500,

       "step": 36,
       "total_flos": 881908425216000.0,
       "train_loss": 4.621011098225911,
+      "train_runtime": 40.2946,
+      "train_samples_per_second": 223.355,
+      "train_steps_per_second": 0.893
     }
   ],
   "logging_steps": 500,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:907d06d261539b8a1e3605fab8d7d4bf5f2b4926be120fd5f849138fc9cb68e7
 size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:232a44bf482ca5a92e56f6d7c781e94d5a384f3b15bcb46eef3b2e0869dcddd9
 size 4664