diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c8a94a77ac2bf320adee8e74455c4f315d3aa768 --- /dev/null +++ b/README.md @@ -0,0 +1,6 @@ +--- +base_model: +- deepseek-ai/DeepSeek-V3 +--- + +Model converted from DeepSeek-V3 to BF16. \ No newline at end of file diff --git a/model-00002-of-000163.safetensors b/model-00002-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eeb17d8a2e5f1febd86b1ad597dab5786eac0a1e --- /dev/null +++ b/model-00002-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c8d1e7087f8b21218f08a9d5aaecc0fc994d1d72a3c60742d63e0809c51f53 +size 8602553952 diff --git a/model-00004-of-000163.safetensors b/model-00004-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f4176ef014e94eedea1038dd0a80be28f7ba97b7 --- /dev/null +++ b/model-00004-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf734ecca1443211236e7014c222ccc3fc6eed47e4c17008a4f40dc8a17dbc04 +size 8598786296 diff --git a/model-00005-of-000163.safetensors b/model-00005-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..36a62a6cb461d425fb8ce1e9dbcc9e59fcb952e2 --- /dev/null +++ b/model-00005-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0767b0f57b3d66ac7de995adfb68565cf80494c8efe6b62b141602edd11a195 +size 8602554048 diff --git a/model-00006-of-000163.safetensors b/model-00006-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..98c29c9cf7e818a4f943a5c41e57adc9525038b8 --- /dev/null +++ b/model-00006-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8acbb80cd4efbc381c311af34f3cb38e83c9ad283f30a36403eb5bbe34d66d +size 8741916520 diff --git a/model-00007-of-000163.safetensors b/model-00007-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07bab6a55b3bfc5bda64de61cb464c74b449de91 --- /dev/null +++ b/model-00007-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d220372c66d82d1c517c7f03903b5b512327f8fc0cf8cdfa1aa95fcfdd66a39b +size 8606225096 diff --git a/model-00009-of-000163.safetensors b/model-00009-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e972eb9fe671bd99f95fc454e809658c4cfe8b05 --- /dev/null +++ b/model-00009-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37104e37c405e27d699c094d02029816b04a53648eb7972f1580c753ed04f065 +size 8598786392 diff --git a/model-00010-of-000163.safetensors b/model-00010-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9acb535b2915501a45e779cd73dd048f71043606 --- /dev/null +++ b/model-00010-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517939da636c1f04402cd46d4d6721d64bfd0c9751944755cc546902a326052a +size 8602553952 diff --git a/model-00011-of-000163.safetensors b/model-00011-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c7aec6e910552013b07027f88ab643982765aa53 --- /dev/null +++ b/model-00011-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec746068be065381c7ad63809dee0ed46158ac899836f19b7acd0602c3f8351f +size 8602554152 diff --git a/model-00012-of-000163.safetensors b/model-00012-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..abedcacaefdfd568c60ce1eafe040d3bcd0ad711 --- /dev/null +++ b/model-00012-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a0b691edb9bde14a67abee926f8d578d850a441e7d6dd3022384ce4271f904 +size 2642451624 diff --git a/model-00013-of-000163.safetensors b/model-00013-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..abb8599d59cbe16e2bd445a4b78992c69988ed40 --- /dev/null +++ b/model-00013-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf391d4cdf384c4d87fbdc9f104525e4140bc06386786bcacc76bc0a98e1c65e +size 8598757320 diff --git a/model-00014-of-000163.safetensors b/model-00014-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d53b651cad837da6c3a2cc32eb858181211e07d --- /dev/null +++ b/model-00014-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea116b40f6b5950609ebf73d5000b75a113d202279197228a998e8af69f09cd +size 8602554136 diff --git a/model-00016-of-000163.safetensors b/model-00016-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e4f2a35647b1f6189de5bc4eec263743493869f --- /dev/null +++ b/model-00016-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a01f0e8eee20014c3ab7c22c557576aa25cd875f36047595f0064cab4ce5214 +size 8602553936 diff --git a/model-00017-of-000163.safetensors b/model-00017-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c78e68df9b8efae459d7e83a0c46671554fc845 --- /dev/null +++ b/model-00017-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108e5b0b11c4434f5f122b3fbf822b82c0298af9fb922075c8b21cdc03098f11 +size 8602554152 diff --git a/model-00018-of-000163.safetensors b/model-00018-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..035d47a8faca332837deba997063d0eba55e2c43 --- /dev/null +++ b/model-00018-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc96b23235009b47592ebe8bc1309a51d9ec31843441515d4817d519123cdea +size 8598786312 diff --git a/model-00019-of-000163.safetensors b/model-00019-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..82c88fef17318da8319bfb6330b11d229f0eb372 --- /dev/null +++ b/model-00019-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9318f5e369e777db0f68d422095f4bd90cf877881fe43ce911ca816aa7fd05 +size 8602554032 diff --git a/model-00020-of-000163.safetensors b/model-00020-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d09e2c2924690f843e3304670562c36f0855c05 --- /dev/null +++ b/model-00020-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789f810ae9cb33d8ece443eea09e6b22776389474081ca16448377dcc0ff5f0f +size 8602554160 diff --git a/model-00021-of-000163.safetensors b/model-00021-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9edb0521e77b3a9d9290e071143f0e8b26410e1 --- /dev/null +++ b/model-00021-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb39bbcdb229c8b8993d22c6e22319e8c18499cb7752383b0d9231ab231a66e +size 8598786512 diff --git a/model-00022-of-000163.safetensors b/model-00022-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dbe896330c3f28787d3a10a90c877b6667768b4c --- /dev/null +++ b/model-00022-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da00a7b77a294a3d0089a0f2b91b3461aaf81f4323e13cf1d08826ad14741528 +size 8602554416 diff --git a/model-00023-of-000163.safetensors b/model-00023-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6989a1540afa7b2f1d179709f3812a532a44898 --- /dev/null +++ b/model-00023-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:417aa003b43c85c89ab8c066cc9edff8091ba4b425457a49103a07e12d6f87e7 +size 8598786704 diff --git a/model-00024-of-000163.safetensors b/model-00024-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d7317f8cf5f7c138a2dd22176745e01c698101b0 --- /dev/null +++ b/model-00024-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c31144a6d63cc65a7b41dd128b40f39ec8b50a0b600e0e4fe96681cdbf329e7 +size 8602554224 diff --git a/model-00025-of-000163.safetensors b/model-00025-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2afa48020aae506398ae8eeb938c2343076beb68 --- /dev/null +++ b/model-00025-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9158672262b6a853685ac5114d64c7aeada871f9a8316a74ebe1dbcf749e6c0a +size 8602554448 diff --git a/model-00026-of-000163.safetensors b/model-00026-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a1695ddcfd812773560306ac3459051b0ff9840e --- /dev/null +++ b/model-00026-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56f04552900d25117f2f37669e26c6e575de80b1858f918884707b1a56b09fe9 +size 8598786616 diff --git a/model-00027-of-000163.safetensors b/model-00027-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8c1b399fca1b8de65da51b9755920d73e5c2da3 --- /dev/null +++ b/model-00027-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3495f7f4f46324f7620c811f071b2c814e78b7fe8e2a3ef93e6a6b0686b252d +size 8602554312 diff --git a/model-00029-of-000163.safetensors b/model-00029-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..130d51317a5942dcfef5d1db0d70c3b68e20ef85 --- /dev/null +++ b/model-00029-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2dfd7c4840e950e28ea1382e044def209cecba4492e97a85844d1bc36787683 +size 8598786520 diff --git a/model-00030-of-000163.safetensors b/model-00030-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ea7648eebd2a2fc5bf3a6f4e65d6ac497a44dce9 --- /dev/null +++ b/model-00030-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0946f9f0b1df2d791dcdc62e035706785782ef3b54cb63a4be4ba6928aea7c2e +size 8602554408 diff --git a/model-00031-of-000163.safetensors b/model-00031-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..195c1a8869c12abfb67ba066d558cb8e12deeecf --- /dev/null +++ b/model-00031-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7341e3e46145da3eb9426d8981ea9defd12e757f98316a91d80b24dba8fd8afb +size 8598786720 diff --git a/model-00032-of-000163.safetensors b/model-00032-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd9099bb72fdc08b0b6a1679ac285a126ef555d6 --- /dev/null +++ b/model-00032-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7904e879aab9bf0eef52e702940a98424815f4e5032f41713eb55f320e87b4 +size 8602554208 diff --git a/model-00033-of-000163.safetensors b/model-00033-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d6b81837ef894435bedc2d10f5caf1b88f17d03 --- /dev/null +++ b/model-00033-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85285a4710fecf5882a91946fb8162e6e79669f0c4bb007eb9197b2db4a4515 +size 8602554448 diff --git a/model-00034-of-000163.safetensors b/model-00034-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1da0c3d5495d01f59969b19bba77f5d7be8f517b --- /dev/null +++ b/model-00034-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee8c3ad83a7ededf3ea8d262e94e0420a6e59c4639f043bd77b5671845dd4d7 +size 3493899088 diff --git a/model-00035-of-000163.safetensors b/model-00035-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de148586557e14c57bc49c292040d1e948334787 --- /dev/null +++ b/model-00035-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de99119bc64b00dde477df67deb2098a46c67d51e8ad79757abc1a7db4de1796 +size 8598757608 diff --git a/model-00036-of-000163.safetensors b/model-00036-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..43334bf98f9396808e926246f2c40232511afea8 --- /dev/null +++ b/model-00036-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd71bcbd2f361e5a7273ca75114df82b5d7b95403cce6e054ea6410bd87a308d +size 8602554424 diff --git a/model-00037-of-000163.safetensors b/model-00037-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa9fc5c4205315c7a5c537129777f977ad739b0c --- /dev/null +++ b/model-00037-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2650de3dc3161ddd56a8ba19e6a466e61618bf47c5ae416ff6929ecea9dcdebd +size 8598786704 diff --git a/model-00038-of-000163.safetensors b/model-00038-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b4cd8c14408aedcc2c83d6b00c2bac1b19d27533 --- /dev/null +++ b/model-00038-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a7da90ab1f8bf5e2d6bfeb5436c80d2ae490afd7f5ecb1d059080d43edc1ac +size 8602554224 diff --git a/model-00039-of-000163.safetensors b/model-00039-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f643fd3ac97f3ba92623559d2882757ae47c9e3 --- /dev/null +++ b/model-00039-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f6e676ae754fe8b467e5edde5305d2b7935eda69550df3e37b1aad95879d14 +size 8602554448 diff --git a/model-00040-of-000163.safetensors b/model-00040-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8714555320316f1b918ab5e45e0c03cc8fe4d2e3 --- /dev/null +++ b/model-00040-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7697b9d1b540f88fa123b49db77e3855296ef97740a7d9a7dae0d333399965c6 +size 8598786608 diff --git a/model-00041-of-000163.safetensors b/model-00041-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57820c78017267de9dcab44864b2dd002d9ed4c8 --- /dev/null +++ b/model-00041-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d4368dbb86b263c36519411105a78ccbac05c83533899af01805604ec07fbb +size 8602554320 diff --git a/model-00042-of-000163.safetensors b/model-00042-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a48fc6aeaaee0727e6fb5b56e0146b01c3be91c6 --- /dev/null +++ b/model-00042-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79052a7916a0afacd7de3ece97e05d46de1c897d35ea4ac5ad313e4c88c49b7b +size 8602554448 diff --git a/model-00043-of-000163.safetensors b/model-00043-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..affd7d31d194a4a73a6c8da917f02128202fc1ab --- /dev/null +++ b/model-00043-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24eb59dff737983f81efc519728277af6593c27271bcceb515eb8cf70ab68efb +size 8598786504 diff --git a/model-00044-of-000163.safetensors b/model-00044-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b2641a7895dd2f1067757c36e96bdd919f199c7 --- /dev/null +++ b/model-00044-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8267d7f4dee8cc1d41c4671b9d7d58a0f43010b5a77d1ef3baf4cae52a6a2b9f +size 8602554416 diff --git a/model-00045-of-000163.safetensors b/model-00045-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7bf1ab49c6cd934412b472c78bed42af242b203c --- /dev/null +++ b/model-00045-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73badad06ce95b1f6edbbfb1ea32891652befea30752d7a4c19483c7b9665de6 +size 8598786704 diff --git a/model-00046-of-000163.safetensors b/model-00046-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8eb920e2398391bac31c78b281076ab43454ee82 --- /dev/null +++ b/model-00046-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9df2cd5d19bddf28175e7de39a5fa3827d41cbcc8c5ceb51faeaea0a9232078 +size 8602554224 diff --git a/model-00047-of-000163.safetensors b/model-00047-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bbd6b8e7b954f911e257c64abacfa810a5f5fa0 --- /dev/null +++ b/model-00047-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56f0f8cc8aa391931513f6baf178c4cb47c4c10a6576ebe381b0b5997c5e591 +size 8602554448 diff --git a/model-00048-of-000163.safetensors b/model-00048-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c38e44693c97c80b657ba36cdf00a22c2fbbd29d --- /dev/null +++ b/model-00048-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b994f93d74881d80c25417ac15aa846993ca1fa595a17c342a20d0328600484e +size 8598786616 diff --git a/model-00049-of-000163.safetensors b/model-00049-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30da41772f79a4f0cb4b5051226c78adddeb351a --- /dev/null +++ b/model-00049-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26187be10a9bba28c7156a2db5966da7dccc9df5e2d4ec2f3750b9bdc5f4aa1 +size 8602554312 diff --git a/model-00050-of-000163.safetensors b/model-00050-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..29d8c01835b63674079f426ccc5b5193c3dff24d --- /dev/null +++ b/model-00050-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1553e307fede0ef31af2c8f201c3d963dbbf5d500948b2c5e3257b4d148ada19 +size 8602554448 diff --git a/model-00051-of-000163.safetensors b/model-00051-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41f6906ec2338fa82515b9d632ae2f30e3a79bd7 --- /dev/null +++ b/model-00051-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:591941ad931ec204e33a1288ad1c649298951ec6025ff728048205d4396cb5d5 +size 8598786520 diff --git a/model-00054-of-000163.safetensors b/model-00054-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..722c064c24ce034ca18d1c179f14b3226e309410 --- /dev/null +++ b/model-00054-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e697df492ac9ca70a2aca90e3973040df5586959b37e502b0fff422b22756b +size 8602554208 diff --git a/model-00055-of-000163.safetensors b/model-00055-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d4d72da91fdea69dd2c8639ab0994898342f897e --- /dev/null +++ b/model-00055-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddebfc2516b69d536b8e89298e0d7f7901651ab9f67323f6ab60eff46ccf15e9 +size 8602554448 diff --git a/model-00056-of-000163.safetensors b/model-00056-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01a311c639813b0a87fbccf672ea867bc3591f70 --- /dev/null +++ b/model-00056-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a1e404de4bf2528c6bcb3c5f2676323129d5f74d850342420d0622b6d05466 +size 3493899088 diff --git a/model-00057-of-000163.safetensors b/model-00057-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e253bb3d5866fa96e9a73055c9cd2d4308fc8747 --- /dev/null +++ b/model-00057-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1111fcc2fb2e843af362ba0630cc34e34a3607ee8d93c3cbfe0093b7f5ebeb84 +size 8598757608 diff --git a/model-00059-of-000163.safetensors b/model-00059-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cfe155025a5413ba73a21ca82a3350895a8f3464 --- /dev/null +++ b/model-00059-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3135e5f89919b3da8c62f1ac1ccf925b1f859f7f387e63f75cd096c97928c29 +size 8598786704 diff --git a/model-00060-of-000163.safetensors b/model-00060-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6728e64790f93cb9287ce410914fce0c11464dd --- /dev/null +++ b/model-00060-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e99c18540d723f5fcdf1a661ef7f7958b8b61ec50861b0817809d2018b143b51 +size 8602554224 diff --git a/model-00061-of-000163.safetensors b/model-00061-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..397fcc4acc4bc6698d602b5c89ba87fd64fa9e89 --- /dev/null +++ b/model-00061-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e836b52d111a06e7cba4e3fdd2135d1f982358fe368d0c0ae9b79151f9dde2c0 +size 8602554448 diff --git a/model-00062-of-000163.safetensors b/model-00062-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55d9ec8b38fa50fec6d215be30aacb62e20898c0 --- /dev/null +++ b/model-00062-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79e1cf1490ff7809d55dfc93a3a4cbec287b3c6b32425d8442a8c75b07a07e6 +size 8598786608 diff --git a/model-00063-of-000163.safetensors b/model-00063-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2243d4038b004dfb5c2686210718cc64f0c3369e --- /dev/null +++ b/model-00063-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e253f9625af6dcdd18247c19286373aea0ff6718c9bb135fb727f5f2165a29d +size 8602554320 diff --git a/model-00064-of-000163.safetensors b/model-00064-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..71c918fbff0276de9115e9428e8882ef9b86fd91 --- /dev/null +++ b/model-00064-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd8d966106988a8688daa32888a0e4ec38590bb8b52a896b2b8895e02976efd +size 8602554448 diff --git a/model-00065-of-000163.safetensors b/model-00065-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b84308ddf2e91dbd947a0d33eeccfad86b0bfea7 --- /dev/null +++ b/model-00065-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5dfbf92537847a20c9d79f0197b77a5f8a39412415a576ba230a11de45a8ed +size 8598786504 diff --git a/model-00066-of-000163.safetensors b/model-00066-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..85a9d656359080704613428e9a9be8074a5ad3c0 --- /dev/null +++ b/model-00066-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730fef963c12be9e7aacca5dfd5a51b3ef39235157a06ed719fcf4679d1a04a9 +size 8602554416 diff --git a/model-00067-of-000163.safetensors b/model-00067-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..80e98e88964e37df24e66818800528af3dfa3b72 --- /dev/null +++ b/model-00067-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2159cafa1886aed906409e222f6a04a3e269289fccac1fa3354fd00acc1e277 +size 8598786704 diff --git a/model-00068-of-000163.safetensors b/model-00068-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8416356a0285a306668ebfd2a07cbc55c9701f2b --- /dev/null +++ b/model-00068-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d86ebf76fed0bc536443fd8d59fab2dc84e90e7370a22755d1a6b5a13939c4d9 +size 8602554224 diff --git a/model-00069-of-000163.safetensors b/model-00069-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d920333f521c34b18e965cee6921e1279638d67d --- /dev/null +++ b/model-00069-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1bbbf62c30af3900cc7abc9685f5c9da5b54b200296a666dce70eb7674cf207 +size 8602554448 diff --git a/model-00070-of-000163.safetensors b/model-00070-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..af563a44eb7e47bef964fa09e37566b38d37f65e --- /dev/null +++ b/model-00070-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de25158427abcca63fab14ec3b062c686a91596227cce348c32f28f0a0e115e5 +size 8598786616 diff --git a/model-00071-of-000163.safetensors b/model-00071-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9bacca186818c489991d8fe00c6e1147a642868e --- /dev/null +++ b/model-00071-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d010b11aa846befeb51fd8df451cab0b06aa66603a9a510a365c68a5e164d67 +size 8602554312 diff --git a/model-00072-of-000163.safetensors b/model-00072-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c3a4f78a01c534f423d611f2852898213f8399ed --- /dev/null +++ b/model-00072-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7528bde5ec837d6f19013b24c2013432679e0dd15fba27b0aa0b5c0385cc2bde +size 8602554448 diff --git a/model-00073-of-000163.safetensors b/model-00073-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2404b61a11e09e4e0602f720dd83e9627dccc5ed --- /dev/null +++ b/model-00073-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5520ab09fcad371d7b62b8ecbc14608e01282dbb31b08148589c7eb392e45f2 +size 8598786520 diff --git a/model-00074-of-000163.safetensors b/model-00074-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55e2cd1f54cb448d7619576c763c8fcd1857a7b0 --- /dev/null +++ b/model-00074-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b70392f0c2e0c8b9e7b1b562ec9c2366f17889224a7845412506481f771ae29 +size 8602554408 diff --git a/model-00075-of-000163.safetensors b/model-00075-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0baeb676946cde5fd9010283c256752d7bfee2e --- /dev/null +++ b/model-00075-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9e57f92b97dc60f2d4d8b40b18ea3a2ab91a15046ad5c7046d24e1ec3b4a531 +size 8598786720 diff --git a/model-00076-of-000163.safetensors b/model-00076-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c70a18c1b5b53ef40b7a2d807b7c35cbe092c78 --- /dev/null +++ b/model-00076-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aca48d6869d6cbecc464e1e6ba39daa316384c2cedd713672e36c2080a2b61f +size 8602554208 diff --git a/model-00077-of-000163.safetensors b/model-00077-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91a04756e0120ade0e2d4d2b9278374f9679b00c --- /dev/null +++ b/model-00077-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf8f628cf3141e624906f7926cee69ed15a4648e1bd45589404cbd3c835d91f5 +size 8602554448 diff --git a/model-00078-of-000163.safetensors b/model-00078-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6d296329a9619125bd38dd3b40c446d3ef3e2d4 --- /dev/null +++ b/model-00078-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:709137ba0ac4f1d7aeb1da7efb536afa92e5fe738cb69c2ba57854ac727a9cd3 +size 3493899088 diff --git a/model-00079-of-000163.safetensors b/model-00079-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7189a7947658bd45016a81adba9d7aa531d724dd --- /dev/null +++ b/model-00079-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b292c546b8519bcdb35c8d531689afed6dbeba8425a8bdb8426f6e4d571bbab6 +size 8598757608 diff --git a/model-00080-of-000163.safetensors b/model-00080-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d15005c760dd7c161c29b984ff796fe6e776dcc2 --- /dev/null +++ b/model-00080-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0382a6e9b21b609f99070ef71f9e187a96880ca3fec477bc661eeadfacf7be6a +size 8602554424 diff --git a/model-00081-of-000163.safetensors b/model-00081-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f02b144c60304403f9f22a822d04646d954d131 --- /dev/null +++ b/model-00081-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83953089ffb9b8f2ad58c9e8a8a2fd24a3871f496b088fe92b886ff9810a4d7 +size 8598786704 diff --git a/model-00082-of-000163.safetensors b/model-00082-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d902406ee71eecdbb4f4c9ef7548b0e84c54a07d --- /dev/null +++ b/model-00082-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1400178981b98b6fcea4c2790487ee455b094ba625a4f4017d263bf4c51d6cff +size 8602554224 diff --git a/model-00083-of-000163.safetensors b/model-00083-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..35c89aea1c1c13f2840d85881f5bccb38a917e13 --- /dev/null +++ b/model-00083-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb636ae5dbc874ecfc0e62c38d41b38368a02359662577bd34894b6ff8af3648 +size 8602554448 diff --git a/model-00084-of-000163.safetensors b/model-00084-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5aa368d9d552a8960bf5dc4d9ed29536c29f7ac8 --- /dev/null +++ b/model-00084-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293ef17b03c7a88cf52d8995b1b5de1dec096477934d74fbe113a673330f04b2 +size 8598786608 diff --git a/model-00085-of-000163.safetensors b/model-00085-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4c3ca84bf0a2c33f9ed73484266f596638976cb --- /dev/null +++ b/model-00085-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a139d5ec636f3b47e5b5793e1fbf4d69db5406e832adc9dc435d068382c7d2 +size 8602554320 diff --git a/model-00086-of-000163.safetensors b/model-00086-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8693b8e16999b16ba19df5be229d19cb8f18969c --- /dev/null +++ b/model-00086-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aa570fdc0ab59a7925ca36529763aabbcbe9f980097a923753c361e435ced7e +size 8602554448 diff --git a/model-00087-of-000163.safetensors b/model-00087-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2b7a4fd4f054c26b12b9476c88a42fc158a0d542 --- /dev/null +++ b/model-00087-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f2bf89abd495f96e0a1cb37cffb33335a50ccd6f5efc605178d0115383155e +size 8598786504 diff --git a/model-00088-of-000163.safetensors b/model-00088-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6727c9b11d6d775b2cb2056735884fa50cf9bcc4 --- /dev/null +++ b/model-00088-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20eb1d24a906c9858a4ae8ba8e1976186c423ea3abb0ab3d9f25a66c6e142f23 +size 8602554416 diff --git a/model-00089-of-000163.safetensors b/model-00089-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df34f57c470a80771cbe6202d71e5e0671f9f2d8 --- /dev/null +++ b/model-00089-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e47e21b3456415a9fb264651366444a7addd7c0e254a7528a02b2c3974c2aa25 +size 8598786704 diff --git a/model-00090-of-000163.safetensors b/model-00090-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2691729db0ab78d3387457740e4a9e204a0e0c8 --- /dev/null +++ b/model-00090-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:127c7d477cba9d30978a3bf7e01597eaab34e973d108c1ecdc75d353637035e4 +size 8602554224 diff --git a/model-00091-of-000163.safetensors b/model-00091-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f941e70133ed2753b8ae93e75840db9a51725b9 --- /dev/null +++ b/model-00091-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59bda264bf19143af751e99c9c4652d0e1ad7db8a6116041493082c6dd642ac6 +size 8602554448 diff --git a/model-00092-of-000163.safetensors b/model-00092-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd9b89aeee7aff98b1a86dda91497607a3ff1361 --- /dev/null +++ b/model-00092-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d995dca3216805917ec89495113ffc59119b7c3de085916fd43aa36d5e61435c +size 8598786616 diff --git a/model-00093-of-000163.safetensors b/model-00093-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2d3c2ca646df3fb455d173866a86584cecba52cb --- /dev/null +++ b/model-00093-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca49bc8e6cf74175ddf2803c4127447ce288f6fe972a68f79b593cdbb9571e94 +size 8602554312 diff --git a/model-00094-of-000163.safetensors b/model-00094-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42653203279c3d9122827f2a9ccbb390b1b92779 --- /dev/null +++ b/model-00094-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:617ad15bb31015aaabdc776dc7843e7cd19bd9d219703238c427dbe716140bc3 +size 8602554448 diff --git a/model-00095-of-000163.safetensors b/model-00095-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e74bb3a2c5cf7243f7d8f708c1d25a20e4ca3b88 --- /dev/null +++ b/model-00095-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5290a9621cbf01bec4df562da3df33f3bd5f60ebdb6831c3ea3bd5fd1c944da5 +size 8598786520 diff --git a/model-00096-of-000163.safetensors b/model-00096-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b413d7c50f9ce3cd010f4e94374ed10621b6dd8 --- /dev/null +++ b/model-00096-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a49fd3660aed947cb0361e66d546f23ac34888795d682648d698682035bb82 +size 8602554408 diff --git a/model-00097-of-000163.safetensors b/model-00097-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8e96542adcc2a385b324de319f56cde3c188858 --- /dev/null +++ b/model-00097-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb89c1918422f8ada7401f5c556ac9fce1c2b317e1e541bf8f162fca6e431f94 +size 8598786720 diff --git a/model-00099-of-000163.safetensors b/model-00099-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6468025cc6f82becb371dd2751a46703687eb827 --- /dev/null +++ b/model-00099-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a87ded442a716dbbcb721ba8639a48ae6cc02e0da993ffb2a24b3d100ec14e +size 8602554448 diff --git a/model-00100-of-000163.safetensors b/model-00100-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f4f99292ca950cf264cb8b263bc511b15683f8a3 --- /dev/null +++ b/model-00100-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96ef067359e5b95763bba79c57bdfd82b751e7ae0d23551b80349f705b881c0 +size 3493899088 diff --git a/model-00101-of-000163.safetensors b/model-00101-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a984771fe68d72807a5eccb65d724019d3a6148 --- /dev/null +++ b/model-00101-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7074b2250a53e19431824c0939dbb9c191ef3ff6bc4f8d1d52b4de249dec83b1 +size 8598757608 diff --git a/model-00102-of-000163.safetensors b/model-00102-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ee650e95050b7ecc48e9351e482425e24a655df --- /dev/null +++ b/model-00102-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458740495efb9d24bad77cde3e38566d3ca5e9e8dd08fa78090094430ab5b4a9 +size 8602554424 diff --git a/model-00103-of-000163.safetensors b/model-00103-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f503afe50aa31a42a1f7dc634da5056e940c31b1 --- /dev/null +++ b/model-00103-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f6e8c15183d03492f02bbd6f816baea4e16f14a00314e871261a40cf95dac8 +size 8598786704 diff --git a/model-00104-of-000163.safetensors b/model-00104-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..957b27757560cff84d5ef5d9c3af164e2ecae850 --- /dev/null +++ b/model-00104-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f5a8b3857262a3ac2c2cfcbc8803e20c7b8d2c571f5d1c80c72f5d60f5c7b45 +size 8602554224 diff --git a/model-00105-of-000163.safetensors b/model-00105-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08632c006f1ee2aca08c0904ddb3229a5b244968 --- /dev/null +++ b/model-00105-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6eea3e875d88c5c34431225cc01a33895bec81adfd1fcdc8015cd953435497c +size 8602554448 diff --git a/model-00106-of-000163.safetensors b/model-00106-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e67ed81fe3f4b5c88306e98e4d5b13da905b56b --- /dev/null +++ b/model-00106-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f103274883e65d26f9e4d576ae0b4b2ca469792d9533c2ef61aff88f8f985e7d +size 8598786608 diff --git a/model-00107-of-000163.safetensors b/model-00107-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..931a4eda596b62e761359db184c64729dba9072d --- /dev/null +++ b/model-00107-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e354d225e056e9b2c66eb813c4efd55ac89279d07319d646cdbe5c652eab209e +size 8602554320 diff --git a/model-00108-of-000163.safetensors b/model-00108-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d63e793b047e335b3466fd917ea6a044a00c895c --- /dev/null +++ b/model-00108-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f8981abdc1471bbca3e34f976c5b56bbc0f68195d8245c374c9f95b39fd6e7 +size 8602554448 diff --git a/model-00110-of-000163.safetensors b/model-00110-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb5f7b82b0bea15b747bc655d772c6db907162cb --- /dev/null +++ b/model-00110-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74023dc41dfa4be71a067f6dfc89a0322cc0c69dd548a90836772aa84b97b7e0 +size 8602554416 diff --git a/model-00111-of-000163.safetensors b/model-00111-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e91bce175974509aaa33fbf71405ea64768b7319 --- /dev/null +++ b/model-00111-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815cc809666231efcb99ba11e60da103fc1d0091b962266f507e16b550a03e95 +size 8598786704 diff --git a/model-00112-of-000163.safetensors b/model-00112-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5bcee5acac1215a03fd14960b10603d7dae148c --- /dev/null +++ b/model-00112-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ac3ff8759214cd59739b97c55b1452a28da307cfba8fd0d67fc9ad900f06f0 +size 8602554224 diff --git a/model-00113-of-000163.safetensors b/model-00113-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e9aef8794f49a5f376664a117cf1f9393f3f097 --- /dev/null +++ b/model-00113-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164d5287b12a2c2f8fa1e886fdbe335ac4efc61db2098fd510a043d58ea8800b +size 8602554448 diff --git a/model-00114-of-000163.safetensors b/model-00114-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..83dbfba9c5bc441a96f3fa0df577ecbade333bc7 --- /dev/null +++ b/model-00114-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5cd3f1de6e37449a18a87c4561fc75e1d284604ff91c524a0fb8993145b157a +size 8598786616 diff --git a/model-00116-of-000163.safetensors b/model-00116-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be22c191961b5c2cab8c36821ecd34b46da0eb7f --- /dev/null +++ b/model-00116-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b31df58ddc80ac59003265ec05650820c77d46b195ec4f69a76bcf2fbd6699d +size 8602554448 diff --git a/model-00117-of-000163.safetensors b/model-00117-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84bc4ce1f347c6336c61bb4e3620d93e4cb8e89c --- /dev/null +++ b/model-00117-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22d30d50c324e77862c6408352863fef0e75bcb0b3433392cfbe2d37c6d6783a +size 8598786520 diff --git a/model-00118-of-000163.safetensors b/model-00118-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f9d89d1269efee0cbabba177f25522bf93ed209 --- /dev/null +++ b/model-00118-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d82a9579ee65e049c876e7393f1eb44442180ddf6e862496b37f93fb173daf +size 8602554408 diff --git a/model-00119-of-000163.safetensors b/model-00119-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4b7fad097f8e72f2bea5de44f619bf69153e380 --- /dev/null +++ b/model-00119-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:851fa932e257d508920fb7e8fdac68e7141043ba85b81483101f3f17ad633778 +size 8598786720 diff --git a/model-00120-of-000163.safetensors b/model-00120-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dfd9e09b1666acc0b351725e6dec9df85bc233b --- /dev/null +++ b/model-00120-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49c78946da88c432a69fbb8af49e63929bef09e81d0f2e986897c1a996b1c0fd +size 8602554208 diff --git a/model-00121-of-000163.safetensors b/model-00121-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b57b5b0380f17cc07bf25ffbaf25eee62711e899 --- /dev/null +++ b/model-00121-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30c02486e286a60e9d1c7ac6a269626e8124551ff03d8b7dd6eb600efd4b621e +size 8602554448 diff --git a/model-00122-of-000163.safetensors b/model-00122-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc0982ce7dcfabd83aada7e24bfa0fea1539b122 --- /dev/null +++ b/model-00122-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c6a3ad51594f4dc29adb60c1f5cfb638608d989f61e6dddac20d90c1e96dc6 +size 3493899088 diff --git a/model-00123-of-000163.safetensors b/model-00123-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0ab2f6251bdeed755bf5ba19538f593bbe007c05 --- /dev/null +++ b/model-00123-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd41f1fee6b357f944220dc4dcddbcade5f9b8470101d966288a3ccadc3dad8 +size 8598757608 diff --git a/model-00124-of-000163.safetensors b/model-00124-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2b3510162d70f3050fe80fc80d879a8dcabca5e --- /dev/null +++ b/model-00124-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded998f520aac0293c685364477d838ff47de7cb00d8d99ffb715db0a5cf7bac +size 8602554424 diff --git a/model-00125-of-000163.safetensors b/model-00125-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..85c4ee0d6dc5332b6b4fe7ffa26b3aa946a35859 --- /dev/null +++ b/model-00125-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c58db91e9b1b55253fe18246c6980172760b881f681af2afe06f77dac35a00d +size 8598786704 diff --git a/model-00126-of-000163.safetensors b/model-00126-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0addf2d4a14a22c370d754e164537b5e15c71057 --- /dev/null +++ b/model-00126-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413d3fa6890d0b40fa5432e2b3c1cbe0c275d8500a78bb5ef7a224d11ce44264 +size 8602554224 diff --git a/model-00127-of-000163.safetensors b/model-00127-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2e65df8a5e74c9940ee386b8fe2b316aaeb4f42 --- /dev/null +++ b/model-00127-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35423b23c410bd3374d7e2e30554ad184b4dbf411fc9147673bccb814d5ae95f +size 8602554448 diff --git a/model-00128-of-000163.safetensors b/model-00128-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e2871365ce07b2df46bc2b5dc56be2e82d5ed0b --- /dev/null +++ b/model-00128-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f827d60974bc770a243d37811863c5bb738ba8988e2bbcd751e8d240bbed0477 +size 8598786608 diff --git a/model-00129-of-000163.safetensors b/model-00129-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..279ff835e347fb8498b846bdf12f21658e642968 --- /dev/null +++ b/model-00129-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb91d02398a2b06713bad0b8998cde0e81daf0f4bff96fd8381a8b91efe8ecc +size 8602554320 diff --git a/model-00131-of-000163.safetensors b/model-00131-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..93d2689c5fac260fab6a39f3410955c3254e8e36 --- /dev/null +++ b/model-00131-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccabf2d1c83e6172adae62ee3fa2748dd2b8841d0f88830097906d79d9ddb271 +size 8598786504 diff --git a/model-00132-of-000163.safetensors b/model-00132-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..97265b5a08e0f7586365770c63e119a3cdaefc12 --- /dev/null +++ b/model-00132-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ddfd3a45e31b658853456eee86cc77332c2bffc5a5d28eb2cb9fa91342e4c5 +size 8602554416 diff --git a/model-00133-of-000163.safetensors b/model-00133-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e7b749cc2a0af94556cfee53d8b58e6a64f34fb7 --- /dev/null +++ b/model-00133-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531922d0532e37a3fc2854e17983518fa1c8ea0fba07ca0dd53c510c10977697 +size 8598786704 diff --git a/model-00134-of-000163.safetensors b/model-00134-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ffd0aaa34b4e124848fefe4d0423b5380ce98753 --- /dev/null +++ b/model-00134-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7b8f4e670ee01cf90990744b8023ffafdb01c42d05ee1ac99f444f7224041d7 +size 8602554224 diff --git a/model-00135-of-000163.safetensors b/model-00135-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..21ec62d723c50965dbc6b9574dc1754878497de3 --- /dev/null +++ b/model-00135-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff7dc483b303362c6dd1a6106d541e2e46fb09f7a76fb9509b080cf8e6c75489 +size 8602554448 diff --git a/model-00136-of-000163.safetensors b/model-00136-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e472539ae889a4a4a597141f7fd1e1608be65b21 --- /dev/null +++ b/model-00136-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c08905b11ac4a7770f22c40874a0cc19f5e83e1d780b9c2721c2cc279e39f9d +size 8598786616 diff --git a/model-00137-of-000163.safetensors b/model-00137-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72b8e92fc03c012bda809c7c7acb53ba70dc2b0a --- /dev/null +++ b/model-00137-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a585d6c18c17b37158a462acaa42747c86343c086f5309dab9dff73f25630395 +size 8602554312 diff --git a/model-00138-of-000163.safetensors b/model-00138-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1942cdd29f5843bb1778961ad5e9855efcd6a400 --- /dev/null +++ b/model-00138-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75eec42a418a118ecbc5b2b64b1a514e1d1797631b88c37840f8032d7fc55186 +size 8602554448 diff --git a/model-00139-of-000163.safetensors b/model-00139-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..846223420558e53bb25c5e4e796941cfe91ecf63 --- /dev/null +++ b/model-00139-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76cafeb1be75ceefa34fff23e0f1ae564215a384ca31bafc652b871324c9f707 +size 8598786520 diff --git a/model-00141-of-000163.safetensors b/model-00141-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..874e2adcd7a4cc3189850809d5925346f822ca99 --- /dev/null +++ b/model-00141-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b78531b78cc2f15924a1f2b122c232dd48d6ad68572477d68e13d12a2b643e8 +size 6283123256 diff --git a/model-00142-of-000163.safetensors b/model-00142-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eccf0f93ea97743255922a01517ca9b62eb0639c --- /dev/null +++ b/model-00142-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31f354b6a7d360569a7ac9e1ce3385b0ad8fb7f1cf44f4ba73ccfdd5dca7e09 +size 8598757608 diff --git a/model-00143-of-000163.safetensors b/model-00143-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2536a0e7d9f57673a1acafc3deb69a509bf2e2c --- /dev/null +++ b/model-00143-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ad90df7c763f7c1f4220822810d03fefa6fb9a28b5b83ac8eca309f6cf4cb9 +size 8602554424 diff --git a/model-00144-of-000163.safetensors b/model-00144-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09275ce560f082780f95fe03fe13ad3eefa9748d --- /dev/null +++ b/model-00144-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd8e99dadc48f3e75f4957fa0b49961e51e1cff91d4abdfdf9c2bd451639da1 +size 8598786704 diff --git a/model-00145-of-000163.safetensors b/model-00145-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ca3eba374a42e1ec884bd0565e4f3f72a044fb1 --- /dev/null +++ b/model-00145-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96e5ae2644c0d5385a70e7247c9cdf961c558826662e30a3d0d1b2ed8c272d3 +size 8602554224 diff --git a/model-00146-of-000163.safetensors b/model-00146-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2b0f1bb13b030ea770e46a0b910a68d342de7954 --- /dev/null +++ b/model-00146-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464bf5e47859eccbdf0e3f14005ceace4506eb324e572bd0e23032a0458bf1f2 +size 8602554448 diff --git a/model-00147-of-000163.safetensors b/model-00147-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7efb2a07ce2c9300039f853cee5bc5127c7111d6 --- /dev/null +++ b/model-00147-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f635c76f05ea0e12b00a37672ae5956587dcbf2f3cb3e627420adb96e6d6bfaf +size 8598786608 diff --git a/model-00148-of-000163.safetensors b/model-00148-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca8cdaae09f6050daa03deaf8160c3fc074ac40b --- /dev/null +++ b/model-00148-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19a9c6cefed2b3211fd7d3a13ae9917f2dfe436f337947633fdf05e7e1cdf626 +size 8602554320 diff --git a/model-00149-of-000163.safetensors b/model-00149-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b334715dc0523fb28589380ff4bdf3d4be208b7d --- /dev/null +++ b/model-00149-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18224a4d22a086f1bdab986860d87ca1d73ed7bde0c23bf613ecd881497b1d78 +size 8602554448 diff --git a/model-00150-of-000163.safetensors b/model-00150-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e56c6fb5e023161b3d17391cf79b1c15a18c0839 --- /dev/null +++ b/model-00150-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370798911671568b089e45ca86bba8a0a78090ea0827dc5209ec7797d7c15644 +size 8598786504 diff --git a/model-00151-of-000163.safetensors b/model-00151-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ffc5e1f40a90d0ca77b6d94d4217d589887b928 --- /dev/null +++ b/model-00151-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02c1f999a06e781e7f4e41b0bdb983ec3c14c602d3513b2e6b9a6cb2c7d58b0 +size 8602554416 diff --git a/model-00152-of-000163.safetensors b/model-00152-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8e7bb6c901f256ba1a76ca9149eb90cfab5262d0 --- /dev/null +++ b/model-00152-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2422ee011f797cf4b376fc3bcd2d0a0291831abfc226bac53e62d9e45174bf30 +size 8598786704 diff --git a/model-00154-of-000163.safetensors b/model-00154-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50f32f78343b2b674b83681771d122e21c728524 --- /dev/null +++ b/model-00154-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63afe37ed22260faa77c4c05d3ea23e965050ab8d57932edd082c78a316741a8 +size 8602554448 diff --git a/model-00155-of-000163.safetensors b/model-00155-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..66e3d61f5639254cc38628e1cf708857e8e738bc --- /dev/null +++ b/model-00155-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65daaae1c42804f406247e7dd999110bd08e141ceb7bd4f7a9f88a1c69ebf1d7 +size 8598786616 diff --git a/model-00156-of-000163.safetensors b/model-00156-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e58b2755224bf91cdb952e7f4251f7d0667a98f6 --- /dev/null +++ b/model-00156-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be755be1a4d498a4de8c0009a3ab02b6e04a64eb337bca68137dcbd7ef27b44 +size 8602554312 diff --git a/model-00157-of-000163.safetensors b/model-00157-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..032f820b392f16c0cb66639bac560650b850c9c3 --- /dev/null +++ b/model-00157-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b52539cbf89b3a1650f54ea5cc5da509bc8d32dc7a3e9a7d20509dc4737a00f +size 8602554448 diff --git a/model-00158-of-000163.safetensors b/model-00158-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..971676700adf7dc37393a50d4c0421039f262075 --- /dev/null +++ b/model-00158-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3b6a25e26237b651efa5c3b92ffcec3231210b016a239b20a1774a401474ab +size 8598786520 diff --git a/model-00159-of-000163.safetensors b/model-00159-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c1fd9b18f5a25a9153e0826132d827396699581 --- /dev/null +++ b/model-00159-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1b915bbf3ce29e8ab0742990b776aa483c37bf17250aa993ea4dd926f11c60 +size 8602554408 diff --git a/model-00160-of-000163.safetensors b/model-00160-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..beea0651e0f420c1ad4d1ccbe868ac521919ab1d --- /dev/null +++ b/model-00160-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d8659457b0422e066c00cc7923c44053eb183a82c921109f7decd1567abaff +size 8602463472 diff --git a/model-00161-of-000163.safetensors b/model-00161-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1dd891f584e1a49fa4b27480d4edb48f6fd9360e --- /dev/null +++ b/model-00161-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb2dbcb055efe70cf541bc94ea6c0d70778bcfc175a532642eaec867b4455de +size 8602554128 diff --git a/model-00162-of-000163.safetensors b/model-00162-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..697a77d261608228ecf3864aa5491c629467ab7c --- /dev/null +++ b/model-00162-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44ca50d7d731f62b5cb4863c3f480f1041b88101da5db8405608a285a2a6fd5a +size 8602554440 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..5b60276c1efb766f6a1aee2e357e27407f6ed12b --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,46188 @@ +{ + "metadata": {}, + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.227.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.input_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_proj_with_mqa.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.161.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.input_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_proj_with_mqa.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.mlp.gate.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.194.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.input_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_proj_with_mqa.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.226.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.input_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.7.self_attn.q_a_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_proj_with_mqa.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.190.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.input_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_proj_with_mqa.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.input_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_proj_with_mqa.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.253.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.input_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_proj_with_mqa.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.187.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.input_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_proj_with_mqa.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.219.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.input_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_proj_with_mqa.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.input_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_proj_with_mqa.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.input_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_proj_with_mqa.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.216.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.216.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.216.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.input_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.15.self_attn.q_a_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_a_layernorm.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_proj_with_mqa.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_layernorm.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.190.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.input_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_proj_with_mqa.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.input_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_proj_with_mqa.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.253.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.input_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_proj_with_mqa.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.gate.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.187.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.input_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_proj_with_mqa.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.219.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.input_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_proj_with_mqa.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.input_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_proj_with_mqa.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.input_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_proj_with_mqa.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.216.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.input_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.23.self_attn.q_a_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_proj_with_mqa.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.190.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.input_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_proj_with_mqa.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.input_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_proj_with_mqa.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.253.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.input_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_proj_with_mqa.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.187.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.input_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_proj_with_mqa.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.219.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.input_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_proj_with_mqa.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.input_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_proj_with_mqa.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.input_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_proj_with_mqa.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.216.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.input_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.31.self_attn.q_a_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_proj_with_mqa.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.190.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.input_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_proj_with_mqa.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.input_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_proj_with_mqa.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.253.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.input_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_proj_with_mqa.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.187.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.input_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_proj_with_mqa.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.219.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.input_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_proj_with_mqa.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.input_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_proj_with_mqa.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.input_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_proj_with_mqa.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.216.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.input_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.39.self_attn.q_a_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_proj_with_mqa.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.190.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.input_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_proj_with_mqa.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.input_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_proj_with_mqa.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.253.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.input_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_proj_with_mqa.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.187.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.input_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_proj_with_mqa.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.219.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.input_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_proj_with_mqa.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.input_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_proj_with_mqa.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.input_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_proj_with_mqa.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.216.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.input_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.47.self_attn.q_a_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_proj_with_mqa.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.190.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.input_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_proj_with_mqa.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.input_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_proj_with_mqa.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.253.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.input_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_proj_with_mqa.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.187.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.input_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_proj_with_mqa.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.219.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.input_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_proj_with_mqa.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.input_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_proj_with_mqa.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.input_layernorm.weight": "model-00141-of-000163.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00141-of-000163.safetensors", + "model.layers.54.self_attn.q_a_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_proj_with_mqa.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.190.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.input_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_proj_with_mqa.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.input_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_proj_with_mqa.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.253.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.input_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_proj_with_mqa.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.187.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.input_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_proj_with_mqa.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.219.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.input_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_proj_with_mqa.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.input_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_proj_with_mqa.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.input_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00160-of-000163.safetensors", + "model.norm.weight": "model-00160-of-000163.safetensors", + "lm_head.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_proj_with_mqa.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.e_score_correction_bias": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.195.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.input_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.embed_tokens.weight": "model-00163-of-000163.safetensors", + "model.layers.61.enorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.hnorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.eh_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.norm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.head.weight": "model-00163-of-000163.safetensors" + } +} \ No newline at end of file