File size: 24,941 Bytes
6059b30 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 |
{
"metadata": {
"total_size": 16031162368
},
"weight_map": {
"model.transformer.blocks.0.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.0.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.0.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.0.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.0.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.0.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.0.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.0.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.0.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.1.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.1.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.1.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.1.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.1.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.1.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.1.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.1.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.1.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.10.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.10.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.10.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.10.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.10.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.10.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.10.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.10.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.10.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.11.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.11.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.11.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.11.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.11.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.11.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.11.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.11.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.11.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.12.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.12.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.12.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.12.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.12.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.12.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.12.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.12.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.12.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.13.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.13.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.13.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.13.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.13.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.13.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.13.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.13.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.13.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.14.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.14.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.14.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.14.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.14.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.14.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.14.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.14.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.14.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.15.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.15.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.15.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.15.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.15.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.15.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.15.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.15.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.15.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.16.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.16.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.16.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.16.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.16.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.16.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.16.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.16.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.16.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.17.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.17.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.17.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.17.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.17.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.17.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.17.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.17.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.17.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.18.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.18.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.18.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.18.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.18.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.18.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.18.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.18.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.18.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.19.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.19.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.19.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.19.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.19.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.19.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.19.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.19.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.19.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.2.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.2.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.2.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.2.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.2.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.2.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.2.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.2.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.2.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.20.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.20.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.20.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.20.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.20.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.20.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.20.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.20.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.20.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.21.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.21.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.21.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.21.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.21.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.21.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.21.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.21.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.21.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.22.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.22.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.22.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.22.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.22.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.22.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.22.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.22.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.22.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.23.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.23.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.23.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.23.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.23.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.23.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.23.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.23.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.23.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.24.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.24.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.24.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.24.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.24.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.24.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.24.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.24.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.24.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.25.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.25.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.25.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.25.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.25.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.25.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.25.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.25.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.25.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.26.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.26.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.26.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.26.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.26.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.26.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.26.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.26.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.26.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.27.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.27.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.27.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.27.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.27.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.27.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.27.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.27.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.27.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.28.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.28.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.28.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.28.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.28.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.28.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.28.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.28.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.28.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.29.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.29.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.29.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.29.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.29.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.29.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.29.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.29.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.29.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.3.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.3.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.3.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.3.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.3.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.3.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.3.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.3.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.3.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.30.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.30.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.30.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.30.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.30.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.30.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.30.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.30.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.30.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.31.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.31.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.31.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.31.ff_out.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.31.ff_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.31.k_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.31.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.31.up_proj.weight": "model-00006-of-00006.safetensors",
"model.transformer.blocks.31.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.4.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.4.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.4.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.4.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.4.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.4.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.4.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.4.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.4.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.5.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.5.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.5.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.5.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.5.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.5.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.5.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.5.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.5.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.6.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.6.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.6.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.6.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.6.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.6.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.6.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.6.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.6.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.7.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.7.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.7.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.7.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.7.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.7.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.7.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.7.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.7.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.8.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.8.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.8.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.8.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.8.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.8.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.8.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.8.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.8.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.9.attn_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.9.attn_out.weight": "model-00001-of-00006.safetensors",
"model.transformer.blocks.9.ff_norm.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.9.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.blocks.9.ff_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.blocks.9.k_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.9.q_proj.weight": "model-00003-of-00006.safetensors",
"model.transformer.blocks.9.up_proj.weight": "model-00005-of-00006.safetensors",
"model.transformer.blocks.9.v_proj.weight": "model-00004-of-00006.safetensors",
"model.transformer.ff_out.weight": "model-00002-of-00006.safetensors",
"model.transformer.ln_f.weight": "model-00001-of-00006.safetensors",
"model.transformer.wte.weight": "model-00001-of-00006.safetensors"
}
} |