PatrickSchwabl committed
Commit 3b047b1
1 Parent(s): d464339

Upload 6 files

Files changed (4):
  1. config.json +4 -3
  2. pytorch_model.bin +2 -2
  3. tokenizer.json +2 -2
  4. tokenizer_config.json +6 -0
config.json CHANGED
@@ -1,8 +1,8 @@
 {
-  "_name_or_path": "./results/runs_fearspeech/checkpoint-320000",
+  "_name_or_path": "/home/fear_speech_project/BERT_final_domain_adapted_model/",
   "activation": "gelu",
   "architectures": [
-    "DistilBertForMaskedLM"
+    "DistilBertForSequenceClassification"
   ],
   "attention_dropout": 0.1,
   "dim": 768,
@@ -15,11 +15,12 @@
   "n_layers": 6,
   "output_past": true,
   "pad_token_id": 0,
+  "problem_type": "single_label_classification",
   "qa_dropout": 0.1,
   "seq_classif_dropout": 0.2,
   "sinusoidal_pos_embds": true,
   "tie_weights_": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.30.2",
+  "transformers_version": "4.31.0",
   "vocab_size": 31102
 }
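
For context: the edit above repurposes the domain-adapted masked-LM checkpoint as a single-label sequence classifier. A minimal loading sketch, assuming a placeholder Hub repo id (the actual id is not shown in this diff):

    # Sketch only: "PatrickSchwabl/fearspeech-model" is a placeholder id and
    # the two-label reading of the output is an assumption, not in the diff.
    import torch
    from transformers import AutoModelForSequenceClassification, AutoTokenizer

    repo_id = "PatrickSchwabl/fearspeech-model"  # placeholder
    tokenizer = AutoTokenizer.from_pretrained(repo_id)
    model = AutoModelForSequenceClassification.from_pretrained(repo_id)

    # "problem_type": "single_label_classification" => one class per text,
    # chosen as the argmax over the logits.
    inputs = tokenizer("Example input.", return_tensors="pt",
                       truncation=True, max_length=128)
    with torch.no_grad():
        logits = model(**inputs).logits
    print(logits.argmax(dim=-1).item())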
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd9868ef027c467a1a188ca7ff6f0e2b89a51bad616eedf34ca3a9df1a7e003d
-size 269762097
+oid sha256:70ccb0e661419e401a51a9336279ccb82a5ed5bc379f1845becd3c7103763ec4
+size 269637293
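
The weights are stored via Git LFS, so only the pointer file changes here: a new sha256 object id and a slightly smaller size, consistent with the MLM head being swapped for a classification head. A quick integrity check of a downloaded copy against the pointer, assuming the file sits in the working directory:

    # Sketch: verify a downloaded pytorch_model.bin against the LFS pointer.
    import hashlib, os

    path = "pytorch_model.bin"  # assumed local path
    digest = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):
            digest.update(chunk)
    assert digest.hexdigest() == "70ccb0e661419e401a51a9336279ccb82a5ed5bc379f1845becd3c7103763ec4"
    assert os.path.getsize(path) == 269637293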
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 512,
+    "max_length": 128,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
     "strategy": {
-      "Fixed": 512
+      "Fixed": 128
     },
     "direction": "Right",
     "pad_to_multiple_of": null,
tokenizer_config.json CHANGED
@@ -5,13 +5,19 @@
   "mask_token": "[MASK]",
   "max_length": 512,
   "model_max_length": 512,
+  "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
   "padding": "max_length",
+  "padding_side": "right",
   "return_tensors": "pt",
   "sep_token": "[SEP]",
+  "stride": 0,
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "DistilBertTokenizer",
   "truncation": false,
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": "[UNK]"
 }
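
The six added keys persist encode-time defaults alongside the tokenizer. As a rough equivalence, they mirror explicit call arguments like the following (same placeholder repo id as above; note that tokenizer.json caps sequences at 128 even though max_length here still reads 512):

    # Sketch: the saved keys correspond to encode-time arguments like these.
    from transformers import AutoTokenizer

    tokenizer = AutoTokenizer.from_pretrained("PatrickSchwabl/fearspeech-model")  # placeholder
    batch = tokenizer(
        ["first text", "second text"],
        padding="max_length",        # pad out to max_length ("padding")
        truncation="longest_first",  # matches "truncation_strategy"
        max_length=128,              # fixed length from tokenizer.json
        return_tensors="pt",         # PyTorch tensors ("return_tensors")
    )
    print(batch["input_ids"].shape)  # torch.Size([2, 128])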