mfajcik committed on
Commit
4a42894
·
verified ·
1 Parent(s): 1a8e376

Upload 6 files

Browse files
config.json CHANGED
@@ -4,7 +4,7 @@
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
- "attention_dropout": 0.1,
8
  "bos_token_id": null,
9
  "eos_token_id": 64001,
10
  "head_dim": 64,
@@ -20,11 +20,14 @@
20
  "num_key_value_heads": 4,
21
  "pretraining_tp": 1,
22
  "rms_norm_eps": 1e-05,
23
- "rope_scaling": null,
24
- "rope_theta": 10000.0,
 
 
 
25
  "tie_word_embeddings": false,
26
  "torch_dtype": "bfloat16",
27
  "transformers_version": "4.46.3",
28
  "use_cache": false,
29
- "vocab_size": 64003
30
  }
 
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
  "bos_token_id": null,
9
  "eos_token_id": 64001,
10
  "head_dim": 64,
 
20
  "num_key_value_heads": 4,
21
  "pretraining_tp": 1,
22
  "rms_norm_eps": 1e-05,
23
+ "rope_scaling": {
24
+ "factor": 2.0,
25
+ "type": "linear"
26
+ },
27
+ "rope_theta": 100000,
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "bfloat16",
30
  "transformers_version": "4.46.3",
31
  "use_cache": false,
32
+ "vocab_size": 64004
33
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "do_sample": true,
4
  "eos_token_id": 64001,
5
  "transformers_version": "4.46.3",
6
- "use_cache": true
7
  }
 
3
  "do_sample": true,
4
  "eos_token_id": 64001,
5
  "transformers_version": "4.46.3",
6
+ "use_cache": false
7
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d30293143d9b87ac59ec5c6607434f662463f7eaebdbe2809d544245bf7706d7
3
- size 2462288496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db83583d9d104cab4c9ce859403fffc29e34839676e25ef08e24f965913228f3
3
+ size 2462296688
special_tokens_map.json CHANGED
@@ -7,7 +7,7 @@
7
  "single_word": false
8
  },
9
  "pad_token": {
10
- "content": "<|end_of_text|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
 
7
  "single_word": false
8
  },
9
  "pad_token": {
10
+ "content": "[EOS]",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
tokenizer.json CHANGED
@@ -1,7 +1,14 @@
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
@@ -32,12 +39,21 @@
32
  },
33
  {
34
  "id": 64002,
35
- "content": "<|end_of_text|>",
36
  "single_word": false,
37
  "lstrip": false,
38
  "rstrip": false,
39
  "normalized": false,
40
- "special": true
 
 
 
 
 
 
 
 
 
41
  }
42
  ],
43
  "normalizer": null,
 
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
+ "padding": {
5
+ "strategy": "BatchLongest",
6
+ "direction": "Right",
7
+ "pad_to_multiple_of": null,
8
+ "pad_id": 64001,
9
+ "pad_type_id": 0,
10
+ "pad_token": "[EOS]"
11
+ },
12
  "added_tokens": [
13
  {
14
  "id": 0,
 
39
  },
40
  {
41
  "id": 64002,
42
+ "content": "|Výsledky|",
43
  "single_word": false,
44
  "lstrip": false,
45
  "rstrip": false,
46
  "normalized": false,
47
+ "special": false
48
+ },
49
+ {
50
+ "id": 64003,
51
+ "content": "|Shrnutí|",
52
+ "single_word": false,
53
+ "lstrip": false,
54
+ "rstrip": false,
55
+ "normalized": false,
56
+ "special": false
57
  }
58
  ],
59
  "normalizer": null,
tokenizer_config.json CHANGED
@@ -25,18 +25,26 @@
25
  "special": true
26
  },
27
  "64002": {
28
- "content": "<|end_of_text|>",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
- "special": true
 
 
 
 
 
 
 
 
34
  }
35
  },
36
  "clean_up_tokenization_spaces": true,
37
  "eos_token": "[EOS]",
38
- "model_max_length": 16384,
39
- "pad_token": "<|end_of_text|>",
40
  "tokenizer_class": "PreTrainedTokenizerFast",
41
  "unk_token": "[UNK]"
42
  }
 
25
  "special": true
26
  },
27
  "64002": {
28
+ "content": "|Výsledky|",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
+ "special": false
34
+ },
35
+ "64003": {
36
+ "content": "|Shrnutí|",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": false
42
  }
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "eos_token": "[EOS]",
46
+ "model_max_length": 2048,
47
+ "pad_token": "[EOS]",
48
  "tokenizer_class": "PreTrainedTokenizerFast",
49
  "unk_token": "[UNK]"
50
  }