File size: 513 Bytes
818fbd3 ed1975c 818fbd3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 |
{
  "attention_layers": [
    12,
    13
  ],
  "auto_mapping": null,
  "base_model_name_or_path": "meta-llama/Llama-3.2-1B",
  "cache_dtype": "float16",
  "cache_size": 32768,
  "cache_type": "FIFO",
  "compression_factor": 4,
  "context_size": 1,
  "global_cache": false,
  "inference_mode": true,
  "neighborhood_size": 2,
  "neurocache_type": "ONDEVICE",
  "pooling_window": 8,
  "retrieval_map": {
    "12": 12
  },
  "retrieval_stride": 2,
  "similarity_fn": "l2",
  "task_type": "CAUSAL_LM",
  "topk": 8
}
|