Pablo94 committed
Commit: 3d4d19c
Parent(s): e323171

Training in progress, epoch 1

config.json CHANGED
@@ -22,7 +22,7 @@
   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "torch_dtype": "float32",
-  "transformers_version": "4.23.1",
+  "transformers_version": "4.33.1",
   "type_vocab_size": 1,
   "use_cache": true,
   "vocab_size": 50262
merges.txt CHANGED
@@ -1,4 +1,4 @@
-#version: 0.2 - Trained by `huggingface/tokenizers`
+#version: 0.2
 Ġ d
 Ġ e
 Ġd e
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b18a61953553101e186554be45449482b6462fff4cff89e4ee2415b1dc1995a
-size 498651117
+oid sha256:bd0791352d8e92b5dc76ba3f01834755c1e8c64a2f7c4aac00ca65917fcc7a57
+size 498648433
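
pytorch_model.bin is tracked with Git LFS, so the diff above only touches the pointer file (the content hash and byte size), not the weights themselves. A hedged sketch for checking that a downloaded copy matches the new pointer, assuming the real file has already been fetched with `git lfs pull`:

    import hashlib
    import os

    PATH = "pytorch_model.bin"  # assumed: the LFS-resolved file, not the pointer
    EXPECTED_OID = "bd0791352d8e92b5dc76ba3f01834755c1e8c64a2f7c4aac00ca65917fcc7a57"
    EXPECTED_SIZE = 498648433

    # Hash in 1 MiB chunks so the ~500 MB file is never fully in memory.
    sha = hashlib.sha256()
    with open(PATH, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):
            sha.update(chunk)

    assert os.path.getsize(PATH) == EXPECTED_SIZE, "size mismatch"
    assert sha.hexdigest() == EXPECTED_OID, "sha256 mismatch"
    print("pytorch_model.bin matches this commit's LFS pointer")
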
tokenizer.json CHANGED
@@ -94,6 +94,7 @@
   "continuing_subword_prefix": "",
   "end_of_word_suffix": "",
   "fuse_unk": false,
+  "byte_fallback": false,
   "vocab": {
     "<s>": 0,
     "<pad>": 1,
tokenizer_config.json CHANGED
@@ -8,6 +8,7 @@
     "rstrip": false,
     "single_word": false
   },
+  "clean_up_tokenization_spaces": true,
   "cls_token": {
     "__type": "AddedToken",
     "content": "<s>",
@@ -34,7 +35,9 @@
     "single_word": false
   },
   "max_len": 512,
-  "name_or_path": "davidmasip/racism",
+  "max_length": 512,
+  "model_max_length": 512,
+  "pad_to_multiple_of": null,
   "pad_token": {
     "__type": "AddedToken",
     "content": "<pad>",
@@ -43,6 +46,8 @@
     "rstrip": false,
     "single_word": false
   },
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "sep_token": {
     "__type": "AddedToken",
     "content": "</s>",
@@ -51,9 +56,11 @@
     "rstrip": false,
     "single_word": false
   },
-  "special_tokens_map_file": null,
+  "stride": 0,
   "tokenizer_class": "RobertaTokenizer",
   "trim_offsets": true,
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": {
     "__type": "AddedToken",
     "content": "<unk>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f522e4e5e5c4602e9e52b85697cb1da6bed2fe4b9b9eb1dadbd644e06adca5fb
-size 3375
+oid sha256:51c53e51bc0583c25102a09dcf47148e135e3cc3ce26901ca34305cf871385c3
+size 4027
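
training_args.bin is a pickled `TrainingArguments` object, which is why its size shifts between transformers versions as new fields are pickled in. A hedged sketch for inspecting it; unpickling executes code, so only do this with a file you trust, and recent torch releases require opting out of weights-only loading:

    import torch

    # Pickled TrainingArguments, not tensors: weights_only=False is needed
    # on newer torch versions (trusted files only).
    args = torch.load("training_args.bin", weights_only=False)
    print(args.num_train_epochs)
    print(args.learning_rate)
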