genne committed on
Commit
7e0c6bc
1 Parent(s): a53f34e

Upload tokenizer

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. special_tokens_map.json +1 -1
  3. tokenizer_config.json +3 -4
README.md CHANGED
@@ -1,10 +1,10 @@
1
  ---
2
  license: apache-2.0
3
- base_model: yanolja/EEVE-Korean-Instruct-10.8B-v1.0
4
  tags:
5
  - trl
6
  - dpo
7
  - generated_from_trainer
 
8
  model-index:
9
  - name: nhn_dpo_v3-eeve_EEVE-Korean-Instruct-10.8B-v1.0_DPO
10
  results: []
 
1
  ---
2
  license: apache-2.0
 
3
  tags:
4
  - trl
5
  - dpo
6
  - generated_from_trainer
7
+ base_model: yanolja/EEVE-Korean-Instruct-10.8B-v1.0
8
  model-index:
9
  - name: nhn_dpo_v3-eeve_EEVE-Korean-Instruct-10.8B-v1.0_DPO
10
  results: []
special_tokens_map.json CHANGED
@@ -7,7 +7,7 @@
7
  "single_word": false
8
  },
9
  "eos_token": {
10
- "content": "<|im_end|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
 
7
  "single_word": false
8
  },
9
  "eos_token": {
10
+ "content": "</s>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -37,13 +37,12 @@
37
  },
38
  "additional_special_tokens": [],
39
  "bos_token": "<s>",
40
- "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'You are a helpful assistant.' %}{% endif %}{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{{'<|im_start|>system\n' + system_message + '<|im_end|>\n'}}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
41
  "clean_up_tokenization_spaces": false,
42
- "eos_token": "<|im_end|>",
43
  "legacy": true,
44
- "model_max_length": 1024,
45
  "pad_token": "</s>",
46
- "padding_size": "right",
47
  "sp_model_kwargs": {},
48
  "spaces_between_special_tokens": false,
49
  "tokenizer_class": "LlamaTokenizer",
 
37
  },
38
  "additional_special_tokens": [],
39
  "bos_token": "<s>",
40
+ "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = \"A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user's questions.\" %}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{{system_message + '\n'}}{% endif %}{% if message['role'] == 'user' %}{{'Human: ' + message['content']+'\n'}}{% elif message['role'] == 'assistant' %}{{'Assistant: ' + message['content']+'\n'}}{% endif %}{% if loop.last and add_generation_prompt %}{{'Assistant: ' }}{% endif %}{% endfor %}",
41
  "clean_up_tokenization_spaces": false,
42
+ "eos_token": "</s>",
43
  "legacy": true,
44
+ "model_max_length": 1000000000000000019884624838656,
45
  "pad_token": "</s>",
 
46
  "sp_model_kwargs": {},
47
  "spaces_between_special_tokens": false,
48
  "tokenizer_class": "LlamaTokenizer",