Pamzyy committed on
Commit
a0ffedd
·
verified ·
1 Parent(s): a73ed34

Training in progress, step 10

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "meta-llama/Meta-Llama-3.1-8B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -31,6 +31,6 @@
31
  "tie_word_embeddings": false,
32
  "torch_dtype": "float32",
33
  "transformers_version": "4.47.1",
34
- "use_cache": true,
35
  "vocab_size": 138626
36
  }
 
1
  {
2
+ "_name_or_path": "./results/checkpoint-5",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
31
  "tie_word_embeddings": false,
32
  "torch_dtype": "float32",
33
  "transformers_version": "4.47.1",
34
+ "use_cache": false,
35
  "vocab_size": 138626
36
  }
model-00001-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12ebfae5b8af8f447067dbedf26bc342f37b5c13f8b716236fc5a44ff83e5ba7
3
  size 4989259264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebcd14bdbdd3c05edbe0118b32e695884e56557186618cb4af04d25a6e280c5e
3
  size 4989259264
model-00007-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80d89a79f5f4cdf17c2f149173b6ae2588b1ed0d2987bb36aeb5c3d9afedb81e
3
  size 2741060264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:049178a0a1fca0c71684df102e88a2c177985e764e887cc4a546a3e01be5c122
3
  size 2741060264
tokenizer_config.json CHANGED
@@ -2053,11 +2053,18 @@
2053
  "clean_up_tokenization_spaces": true,
2054
  "eos_token": "<|end_of_text|>",
2055
  "extra_special_tokens": {},
 
2056
  "model_input_names": [
2057
  "input_ids",
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 131072,
 
2061
  "pad_token": "<|end_of_text|>",
2062
- "tokenizer_class": "PreTrainedTokenizerFast"
 
 
 
 
 
2063
  }
 
2053
  "clean_up_tokenization_spaces": true,
2054
  "eos_token": "<|end_of_text|>",
2055
  "extra_special_tokens": {},
2056
+ "max_length": 512,
2057
  "model_input_names": [
2058
  "input_ids",
2059
  "attention_mask"
2060
  ],
2061
  "model_max_length": 131072,
2062
+ "pad_to_multiple_of": null,
2063
  "pad_token": "<|end_of_text|>",
2064
+ "pad_token_type_id": 0,
2065
+ "padding_side": "right",
2066
+ "stride": 0,
2067
+ "tokenizer_class": "PreTrainedTokenizerFast",
2068
+ "truncation_side": "right",
2069
+ "truncation_strategy": "longest_first"
2070
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a908ade51cd9b861382462385f51c098680a2e9c61e12916af6dea0e00d0e95
3
- size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1f8d8edb60ee54eabba281f40c9e9a60149ef8b8806d512b31a4d69a1bbc874
3
+ size 5368