ikoghoemmanuell committed on
Commit
d5f7c84
1 Parent(s): 8f3e7bc

Upload XLNetForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +35 -19
  2. pytorch_model.bin +2 -2
config.json CHANGED
@@ -1,38 +1,54 @@
1
  {
2
- "_name_or_path": "roberta-base",
3
  "architectures": [
4
- "RobertaForSequenceClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "bos_token_id": 0,
8
- "classifier_dropout": null,
 
 
 
 
 
 
9
  "eos_token_id": 2,
10
- "hidden_act": "gelu",
11
- "hidden_dropout_prob": 0.1,
12
- "hidden_size": 768,
13
  "id2label": {
14
  "0": "LABEL_0",
15
  "1": "LABEL_1",
16
  "2": "LABEL_2"
17
  },
18
  "initializer_range": 0.02,
19
- "intermediate_size": 3072,
20
  "label2id": {
21
  "LABEL_0": 0,
22
  "LABEL_1": 1,
23
  "LABEL_2": 2
24
  },
25
- "layer_norm_eps": 1e-05,
26
- "max_position_embeddings": 514,
27
- "model_type": "roberta",
28
- "num_attention_heads": 12,
29
- "num_hidden_layers": 12,
30
- "pad_token_id": 1,
31
- "position_embedding_type": "absolute",
32
  "problem_type": "single_label_classification",
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  "torch_dtype": "float32",
34
  "transformers_version": "4.29.2",
35
- "type_vocab_size": 1,
36
- "use_cache": true,
37
- "vocab_size": 50265
 
38
  }
 
1
  {
2
+ "_name_or_path": "xlnet-base-cased",
3
  "architectures": [
4
+ "XLNetForSequenceClassification"
5
  ],
6
+ "attn_type": "bi",
7
+ "bi_data": false,
8
+ "bos_token_id": 1,
9
+ "clamp_len": -1,
10
+ "d_head": 64,
11
+ "d_inner": 3072,
12
+ "d_model": 768,
13
+ "dropout": 0.1,
14
+ "end_n_top": 5,
15
  "eos_token_id": 2,
16
+ "ff_activation": "gelu",
 
 
17
  "id2label": {
18
  "0": "LABEL_0",
19
  "1": "LABEL_1",
20
  "2": "LABEL_2"
21
  },
22
  "initializer_range": 0.02,
 
23
  "label2id": {
24
  "LABEL_0": 0,
25
  "LABEL_1": 1,
26
  "LABEL_2": 2
27
  },
28
+ "layer_norm_eps": 1e-12,
29
+ "mem_len": null,
30
+ "model_type": "xlnet",
31
+ "n_head": 12,
32
+ "n_layer": 12,
33
+ "pad_token_id": 5,
 
34
  "problem_type": "single_label_classification",
35
+ "reuse_len": null,
36
+ "same_length": false,
37
+ "start_n_top": 5,
38
+ "summary_activation": "tanh",
39
+ "summary_last_dropout": 0.1,
40
+ "summary_type": "last",
41
+ "summary_use_proj": true,
42
+ "task_specific_params": {
43
+ "text-generation": {
44
+ "do_sample": true,
45
+ "max_length": 250
46
+ }
47
+ },
48
  "torch_dtype": "float32",
49
  "transformers_version": "4.29.2",
50
+ "untie_r": true,
51
+ "use_mems_eval": true,
52
+ "use_mems_train": false,
53
+ "vocab_size": 32000
54
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f7b1ff1b214ef74b5c9aca2f393c0cbf21f890e0c49461266641e7569fdea66
3
- size 498665141
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75598ef3c8326311178f9dda2f0b927076731d3fb09bdb707a38c1643d7af141
3
+ size 469314837