Upload 5 files

Browse files

Files changed (5) hide show

config.json +38 -0
generation_config.json +9 -0
measurement.json +0 -0
tokenizer.json +0 -0
tokenizer_config.json +35 -0

config.json ADDED Viewed

	@@ -0,0 +1,38 @@

+{
+	"architectures": [
+		"Qwen2ForCausalLM"
+	],
+	"attention_dropout": 0.0,
+	"bos_token_id": 151643,
+	"eos_token_id": 151643,
+	"hidden_act": "silu",
+	"hidden_size": 5120,
+	"initializer_range": 0.02,
+	"intermediate_size": 13824,
+	"max_position_embeddings": 131072,
+	"max_window_layers": 48,
+	"model_type": "qwen2",
+	"num_attention_heads": 40,
+	"num_hidden_layers": 48,
+	"num_key_value_heads": 8,
+	"quantization_config": {
+		"bits": 4.5,
+		"calibration": {
+			"dataset": "(default)",
+			"length": 2048,
+			"rows": 115
+		},
+		"head_bits": 6,
+		"quant_method": "exl2",
+		"version": "0.2.7"
+	},
+	"rms_norm_eps": 1e-05,
+	"rope_theta": 1000000.0,
+	"sliding_window": 131072,
+	"tie_word_embeddings": false,
+	"torch_dtype": "bfloat16",
+	"transformers_version": "4.43.1",
+	"use_cache": true,
+	"use_sliding_window": false,
+	"vocab_size": 152064
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+	"_from_model_config": true,
+	"bos_token_id": 151646,
+	"do_sample": true,
+	"eos_token_id": 151643,
+	"temperature": 0.6,
+	"top_p": 0.95,
+	"transformers_version": "4.39.3"
+}

measurement.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+	"add_bos_token": true,
+	"add_eos_token": false,
+	"bos_token": {
+		"__type": "AddedToken",
+		"content": "<｜begin▁of▁sentence｜>",
+		"lstrip": false,
+		"normalized": true,
+		"rstrip": false,
+		"single_word": false
+	},
+	"chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='') %}{%- for message in messages %}{%- if message['role'] == 'system' %}{% set ns.system_prompt = message['content'] %}{%- endif %}{%- endfor %}{{bos_token}}{{ns.system_prompt}}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{{'<｜User｜>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is none %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls']%}{%- if not ns.is_first %}{{'<｜Assistant｜><｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<｜tool▁call▁end｜>'}}{%- set ns.is_first = true -%}{%- else %}{{'\\n' + '<｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + tool['function']['arguments'] + '\\n' + '```' + '<｜tool▁call▁end｜>'}}{{'<｜tool▁calls▁end｜><｜end▁of▁sentence｜>'}}{%- endif %}{%- endfor %}{%- endif %}{%- if message['role'] == 'assistant' and message['content'] is not none %}{%- if ns.is_tool %}{{'<｜tool▁outputs▁end｜>' + message['content'] + '<｜end▁of▁sentence｜>'}}{%- set ns.is_tool = false -%}{%- else %}{% set content = message['content'] %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{{'<｜Assistant｜>' + content + '<｜end▁of▁sentence｜>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<｜tool▁outputs▁begin｜><｜tool▁output▁begin｜>' + message['content'] + '<｜tool▁output▁end｜>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\\n<｜tool▁output▁begin｜>' + message['content'] + '<｜tool▁output▁end｜>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<｜tool▁outputs▁end｜>'}}{% endif %}{% if add_generation_prompt and not ns.is_tool %}{{'<｜Assistant｜>'}}{% endif %}",
+	"clean_up_tokenization_spaces": false,
+	"eos_token": {
+		"__type": "AddedToken",
+		"content": "<｜end▁of▁sentence｜>",
+		"lstrip": false,
+		"normalized": true,
+		"rstrip": false,
+		"single_word": false
+	},
+	"legacy": true,
+	"model_max_length": 16384,
+	"pad_token": {
+		"__type": "AddedToken",
+		"content": "<｜end▁of▁sentence｜>",
+		"lstrip": false,
+		"normalized": true,
+		"rstrip": false,
+		"single_word": false
+	},
+	"sp_model_kwargs": {},
+	"tokenizer_class": "LlamaTokenizerFast",
+	"unk_token": null
+}